diff --git a/.gitattributes b/.gitattributes index c7d9f3332a950355d5a77d85000f05e6f45435ea..b9d26a58c1b864f6cf5c4bf349a5c4202e060c61 100644 --- a/.gitattributes +++ b/.gitattributes @@ -32,3 +32,99 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text *.zip filter=lfs diff=lfs merge=lfs -text *.zst filter=lfs diff=lfs merge=lfs -text *tfevents* filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_gem_xsum_article_DOC_summary_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_GEM-wiki_lingua_en_tldr_en_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_GEM-web_nlg_en_PALM_prompt_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_gem_xsum_article_DOC_summary_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_GEM-wiki_lingua_en_tldr_en_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_GEM-wiki_lingua_en_tldr_en_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_GEM-web_nlg_en_PALM_prompt_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_GEM-web_nlg_en_PALM_prompt_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_GEM-web_nlg_en_PALM_prompt_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_gem_xsum_article_DOC_summary_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_GEM-wiki_lingua_en_tldr_en_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_GEM-web_nlg_en_PALM_prompt_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_GEM-wiki_lingua_en_tldr_en_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_GEM-web_nlg_en_PALM_prompt_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_gem_xsum_article_DOC_summary_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_gem_xsum_article_DOC_summary_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_gem_xsum_article_DOC_summary_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_GEM-web_nlg_en_PALM_prompt_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_GEM-web_nlg_en_PALM_prompt_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_GEM-wiki_lingua_en_tldr_en_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_GEM-web_nlg_en_PALM_prompt_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_GEM-wiki_lingua_en_tldr_en_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_gem_xsum_article_DOC_summary_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_gem_xsum_article_DOC_summary_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_GEM-wiki_lingua_en_tldr_en_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_gem_xsum_article_DOC_summary_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_gem_xsum_article_DOC_summary_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_GEM-web_nlg_en_PALM_prompt_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_GEM-wiki_lingua_en_tldr_en_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_GEM-wiki_lingua_en_tldr_en_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_GEM-wiki_lingua_en_tldr_en_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_GEM-wiki_lingua_en_tldr_en_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_gem_xsum_article_DOC_summary_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_gem_xsum_article_DOC_summary_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_gem_xsum_article_DOC_summary_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_GEM-web_nlg_en_PALM_prompt_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_GEM-wiki_lingua_en_tldr_en_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_GEM-web_nlg_en_PALM_prompt_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_GEM-wiki_lingua_en_tldr_en_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_GEM-wiki_lingua_en_tldr_en_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_GEM-web_nlg_en_PALM_prompt_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_gem_xsum_article_DOC_summary_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_GEM-web_nlg_en_PALM_prompt_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_GEM-wiki_lingua_en_tldr_en_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_gem_xsum_article_DOC_summary_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_GEM-web_nlg_en_PALM_prompt_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_GEM-web_nlg_en_PALM_prompt_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_gem_xsum_article_DOC_summary_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_GEM-web_nlg_en_PALM_prompt_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_GEM-wiki_lingua_en_tldr_en_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_gem_xsum_article_DOC_summary_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_GEM-web_nlg_en_PALM_prompt_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_GEM-wiki_lingua_en_tldr_en_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_gem_xsum_article_DOC_summary_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_GEM-web_nlg_en_PALM_prompt_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_GEM-web_nlg_en_PALM_prompt_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_gem_xsum_article_DOC_summary_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_gem_xsum_article_DOC_summary_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_GEM-wiki_lingua_en_tldr_en_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_GEM-web_nlg_en_PALM_prompt_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_GEM-web_nlg_en_PALM_prompt_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_gem_xsum_article_DOC_summary_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_GEM-web_nlg_en_PALM_prompt_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_GEM-wiki_lingua_en_tldr_en_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_gem_xsum_article_DOC_summary_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_GEM-wiki_lingua_en_tldr_en_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_GEM-wiki_lingua_en_tldr_en_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_GEM-wiki_lingua_en_tldr_en_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_gem_xsum_article_DOC_summary_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_gem_xsum_article_DOC_summary_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_GEM-wiki_lingua_en_tldr_en_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_GEM-web_nlg_en_PALM_prompt_1.jsonl filter=lfs diff=lfs merge=lfs -text diff --git a/4b284b84bc4seed1/evaluation/generation/agg.4b284b84bc4seed1_GEM-web_nlg_en_PALM_prompt_0.json b/4b284b84bc4seed1/evaluation/generation/agg.4b284b84bc4seed1_GEM-web_nlg_en_PALM_prompt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..408cb29485788ff10bf5e2ebe9d98042e31c6139 --- /dev/null +++ b/4b284b84bc4seed1/evaluation/generation/agg.4b284b84bc4seed1_GEM-web_nlg_en_PALM_prompt_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.4177738397053596, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.052439714987504826}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07401331365029154, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.001555945380008501}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.309544677126812, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004598258018956965}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.11313553204694117, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0020976821294602234}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03523505191827857, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0009392296781654515}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.15329454407408277, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003251728201432321}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.05411413548524944, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0013020734544028827}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.07061132409656197, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0014031957668770357}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.30042353738636374, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0044778245769371994}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.10845705136602556, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0019284471387199143}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.07049851230067716, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.001450359178267902}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.296810156480222, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0043631335921961835}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.10792394253569278, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0019640770726289487}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed1/evaluation/generation/agg.4b284b84bc4seed1_GEM-web_nlg_en_PALM_prompt_1.json b/4b284b84bc4seed1/evaluation/generation/agg.4b284b84bc4seed1_GEM-web_nlg_en_PALM_prompt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..9e3865700cc6167a468b96626bda374055b3519c --- /dev/null +++ b/4b284b84bc4seed1/evaluation/generation/agg.4b284b84bc4seed1_GEM-web_nlg_en_PALM_prompt_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.5808615724978651, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.03393350967485746}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.08183691647303251, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0015166625147494993}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.40093348191479217, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005450906036616762}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.12727475120836446, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002035424606741712}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.039062153239498784, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0009349863984338872}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.20112348772170943, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003804920107675235}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.06096091447803779, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0012946551599852026}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.07650521343895433, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0013445352921906551}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.37517446453693076, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004982125783681737}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.1192836731407637, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001834016996545526}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.07726225443418276, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.001411238354454551}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.3769882191273612, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004973103856227287}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.12012804167712486, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0018942369664582516}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed1/evaluation/generation/agg.4b284b84bc4seed1_GEM-web_nlg_en_PALM_prompt_2.json b/4b284b84bc4seed1/evaluation/generation/agg.4b284b84bc4seed1_GEM-web_nlg_en_PALM_prompt_2.json new file mode 100644 index 0000000000000000000000000000000000000000..a59264400f1a2bb9c20e13322d883d950efc0106 --- /dev/null +++ b/4b284b84bc4seed1/evaluation/generation/agg.4b284b84bc4seed1_GEM-web_nlg_en_PALM_prompt_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.6974388179157304, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.030575587628070142}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.08378329306693072, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.001459322065449314}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.4295176674907729, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005387840357836537}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.13158075248220336, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0019778747548532725}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03959861804048329, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0008790815089921375}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.21857768529907604, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003978406350005915}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.06253675704279393, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0012350283375229683}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.0765488634109198, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001262760988042247}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.3942968542813885, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004825967992749896}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.12041670906511595, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001724997794417473}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.07912745617089588, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0013596543752117662}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.40482037642139057, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004938559564217245}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.12422716343042028, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0018397851260800163}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed1/evaluation/generation/agg.4b284b84bc4seed1_GEM-web_nlg_en_PALM_prompt_3.json b/4b284b84bc4seed1/evaluation/generation/agg.4b284b84bc4seed1_GEM-web_nlg_en_PALM_prompt_3.json new file mode 100644 index 0000000000000000000000000000000000000000..76173ee63ba292c4ff68c0f1d7ef89c7f18d6e2c --- /dev/null +++ b/4b284b84bc4seed1/evaluation/generation/agg.4b284b84bc4seed1_GEM-web_nlg_en_PALM_prompt_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.8278535585588646, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.04101323263962433}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.08547615960283327, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0014631064392462048}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.45233724476476256, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005498610961440376}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.13488847581723404, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0019541441973022983}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.04064020009202515, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0009117668832831653}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.23147273606302815, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.004055355768121839}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.06437212669435428, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0012436500824994457}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.07766706751152817, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0012705151561288445}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.4116826372221156, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004846073095478439}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.12265416975642841, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001687981425852585}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.08067112264899551, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0013779713860748017}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.42508315288079185, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.005020947504999342}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.12722726363829323, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0018316120685934315}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed1/evaluation/generation/agg.4b284b84bc4seed1_GEM-web_nlg_en_PALM_prompt_4.json b/4b284b84bc4seed1/evaluation/generation/agg.4b284b84bc4seed1_GEM-web_nlg_en_PALM_prompt_4.json new file mode 100644 index 0000000000000000000000000000000000000000..5c562d780fba04a26eb221fa4121b41c7bd16419 --- /dev/null +++ b/4b284b84bc4seed1/evaluation/generation/agg.4b284b84bc4seed1_GEM-web_nlg_en_PALM_prompt_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.8696996582752973, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.06098328946071962}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.0846654378867452, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0014210010721050707}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.4578457479151435, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005514991901446975}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.1345378611428427, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0019444813188940376}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03959585063348627, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.000862580003329711}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.2318178313336565, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0041148040681156135}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.06331896436631664, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0012304846406140408}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.07578970344610945, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0011783081782238954}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.4122041018783002, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004808418678515961}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.1206116472621873, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001620078997028922}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.0796291662268957, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.001316435535538898}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.43058423280412716, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.005076088365482536}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.12652519308473198, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0018015979293605463}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed1/evaluation/generation/agg.4b284b84bc4seed1_GEM-web_nlg_en_PALM_prompt_5.json b/4b284b84bc4seed1/evaluation/generation/agg.4b284b84bc4seed1_GEM-web_nlg_en_PALM_prompt_5.json new file mode 100644 index 0000000000000000000000000000000000000000..5dcf4ffa579ee20c54094f4a125058bd8e6ea747 --- /dev/null +++ b/4b284b84bc4seed1/evaluation/generation/agg.4b284b84bc4seed1_GEM-web_nlg_en_PALM_prompt_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.9386565201757037, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.044526839780327905}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.08665394421115923, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0013765101453522592}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.479351769718965, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.00548474489542107}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.13836362229996832, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.001893431540140422}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.04073112194630253, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0008342579281972372}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.24709583361079115, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.004288275564287053}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.06552803780701107, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001201220687887674}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.07688627300671028, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0011617752110929672}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.4288123063878505, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004826731215989172}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.12284158062218388, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0015900050300239478}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.08154653189712766, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.001288193874235195}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.4505990363238062, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.005059301966187745}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.1301416572009741, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.001768541697398853}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed1/evaluation/generation/agg.4b284b84bc4seed1_GEM-wiki_lingua_en_tldr_en_0.json b/4b284b84bc4seed1/evaluation/generation/agg.4b284b84bc4seed1_GEM-wiki_lingua_en_tldr_en_0.json new file mode 100644 index 0000000000000000000000000000000000000000..38d009039fcea4c958053d6c0c4002bbb727c3da --- /dev/null +++ b/4b284b84bc4seed1/evaluation/generation/agg.4b284b84bc4seed1_GEM-wiki_lingua_en_tldr_en_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.13997262682188616, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0018152662704601968}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.23988301526777517, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0026425508349757127}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.16422245329729376, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0018151110735496203}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.02739555088551612, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007299475693711506}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.04882561093577656, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0013519389814047277}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.03235069293218825, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0008205093824111827}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.10940153468767774, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0012797812738055785}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.19392296248486443, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0021299443087579575}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.1298012454573935, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0013082389095494423}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.12920003480420952, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0016583776510762952}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.22237769560119033, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002445338658648684}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.15178310664024564, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016581127885119964}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 1.4010466021962698, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.05693469656785709}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed1/evaluation/generation/agg.4b284b84bc4seed1_GEM-wiki_lingua_en_tldr_en_1.json b/4b284b84bc4seed1/evaluation/generation/agg.4b284b84bc4seed1_GEM-wiki_lingua_en_tldr_en_1.json new file mode 100644 index 0000000000000000000000000000000000000000..2457b231e418a9ab0a0897c0eee4d335c80fac76 --- /dev/null +++ b/4b284b84bc4seed1/evaluation/generation/agg.4b284b84bc4seed1_GEM-wiki_lingua_en_tldr_en_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.19237806407108246, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002156616087328965}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.3212993636930355, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002829724921518021}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.22176158764199283, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0019496812102440851}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.04730550033705585, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0010038562816699207}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.0810126790953652, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0016920263323925329}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.05436564304591471, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0010398581680374484}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.13189452873558555, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0014440357444886517}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.22728266255319154, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0021740082956540176}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.15298606072602197, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001269522698605816}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.1799760146194542, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.002013284357082607}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.3015175800896575, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0026743484362997554}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.20773701812397452, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0018267476451028011}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 2.6792767534985105, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.08050348994884776}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed1/evaluation/generation/agg.4b284b84bc4seed1_GEM-wiki_lingua_en_tldr_en_2.json b/4b284b84bc4seed1/evaluation/generation/agg.4b284b84bc4seed1_GEM-wiki_lingua_en_tldr_en_2.json new file mode 100644 index 0000000000000000000000000000000000000000..54c0770799b0118e0862b57ac0b4f19a5c9c7aa6 --- /dev/null +++ b/4b284b84bc4seed1/evaluation/generation/agg.4b284b84bc4seed1_GEM-wiki_lingua_en_tldr_en_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.19587403318777896, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002246482935330373}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.3104623013424553, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0026357716525505985}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.21881031202295378, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0018340980892655135}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.049518456494770303, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.001177357025652893}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.07843155253080596, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0016707411483431178}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.05407980043809886, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0010322675581464652}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.13795120173138903, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001669101235947338}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.22381109650316425, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002115149596829255}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.15447333837028793, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0012811266282334365}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.18399939129198817, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0021107295487964614}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.2924275031032992, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0024986416120394883}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.20577620783096848, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0017206650892505897}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 2.825588151177289, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.0827483173505062}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed1/evaluation/generation/agg.4b284b84bc4seed1_GEM-wiki_lingua_en_tldr_en_3.json b/4b284b84bc4seed1/evaluation/generation/agg.4b284b84bc4seed1_GEM-wiki_lingua_en_tldr_en_3.json new file mode 100644 index 0000000000000000000000000000000000000000..03bbf5a562201eea752899b5ebf5fef6a4e2e9ff --- /dev/null +++ b/4b284b84bc4seed1/evaluation/generation/agg.4b284b84bc4seed1_GEM-wiki_lingua_en_tldr_en_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.1647227013547415, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0024792520261390483}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.2560613183847905, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0032797831033041618}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.17955806504481292, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002195205258030929}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.040393011250336536, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.001120492765195676}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.06579426072456108, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.001694481658818446}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.04429422701774445, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0010178187766663955}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.11737676404806478, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0018604626033532456}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.1856490443924171, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.00253379229574718}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.12746828061030624, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0015396980890683188}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.15523651118051682, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0023598380194680005}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.24112578036228802, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0030888339817801563}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.1689495507422565, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0020580481966186253}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 2.77140298721746, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.09911601058676267}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed1/evaluation/generation/agg.4b284b84bc4seed1_GEM-wiki_lingua_en_tldr_en_4.json b/4b284b84bc4seed1/evaluation/generation/agg.4b284b84bc4seed1_GEM-wiki_lingua_en_tldr_en_4.json new file mode 100644 index 0000000000000000000000000000000000000000..0f618c4fa6fcc7618b7dfa06edb3bc46dc52fda9 --- /dev/null +++ b/4b284b84bc4seed1/evaluation/generation/agg.4b284b84bc4seed1_GEM-wiki_lingua_en_tldr_en_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.053177399565422716, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.001969539589668854}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.08460445332976693, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002887654568198146}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.05724507901787019, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.001923136290184156}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.012859547969705542, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.000726325510216138}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.02237244864266085, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0012034662851936587}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.014128667931700438, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0006962023161566057}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.03993285011532237, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0014928569276828109}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.06466228514995502, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0022622950372018576}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.042868526761057124, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0014217476738280137}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.05008717864701033, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0018614454895917413}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.07995227312474681, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0027408841913450226}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.053934021939145045, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0018135115805431904}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 0.6374428010243339, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.04679817619985886}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed1/evaluation/generation/agg.4b284b84bc4seed1_GEM-wiki_lingua_en_tldr_en_5.json b/4b284b84bc4seed1/evaluation/generation/agg.4b284b84bc4seed1_GEM-wiki_lingua_en_tldr_en_5.json new file mode 100644 index 0000000000000000000000000000000000000000..5b640a58ffd36cabb79d2af01b9f1dfb4bc1accb --- /dev/null +++ b/4b284b84bc4seed1/evaluation/generation/agg.4b284b84bc4seed1_GEM-wiki_lingua_en_tldr_en_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.009250162353650573, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0009501892043502089}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.01399225543923628, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0013479443593293063}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.009409482800898775, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0008719922868900455}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.0025132950634529213, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0003496566473256293}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.003986174570934941, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0005228969007076435}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.0024954950292378434, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.00030758521273803235}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.006939530851512524, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.000721287497804254}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.010674568197211812, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0010578455964358668}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.007016931130854418, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0006474630715093982}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.008770387592628782, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0008958471929010777}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.013287426441297979, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0012768296011753365}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.008928183444317063, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0008250504967685091}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 1.5497714003816197e-06, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 2.826544891292017e-06}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed1/evaluation/generation/agg.4b284b84bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_0.json b/4b284b84bc4seed1/evaluation/generation/agg.4b284b84bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..1ef8c0f91e00e65d0b9c59b3c310b5e48d4d4ce8 --- /dev/null +++ b/4b284b84bc4seed1/evaluation/generation/agg.4b284b84bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 0.01707387064925112, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.004548339499332125}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.01479209987025161, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0003848187529004132}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.02647907855108807, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0007373776368265799}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.01833385014011665, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0004556651351480112}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.00018468533574224637, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 3.7035782299895355e-05}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.00032184358555587336, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 6.80865158511292e-05}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.00022602188070215841, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 4.551736869387828e-05}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.014749675627827365, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0003794521861304636}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.02642067669572227, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0007319703340695989}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.01828543709345876, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.000449785707890762}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.01381746395527955, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0003369009463365385}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.024406964608590324, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0005979225418060756}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.017042834318925764, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.00038117023392555423}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed1/evaluation/generation/agg.4b284b84bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_1.json b/4b284b84bc4seed1/evaluation/generation/agg.4b284b84bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_1.json new file mode 100644 index 0000000000000000000000000000000000000000..4ff76d50102e4bc178fee6e88369c3332d5eefb6 --- /dev/null +++ b/4b284b84bc4seed1/evaluation/generation/agg.4b284b84bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 11.199945366026236, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.09740891554529413}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.5190142019208609, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.003327240390036289}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4114616078138066, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0030408033259645612}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.43361162405107295, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0024498717646033665}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.24092206705754915, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0025432949505695425}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.18797583914402394, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002107165588256214}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.1983453767330724, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0019553142654631156}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.3810297781145268, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002955659050147338}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.2982904326283383, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002441126924534855}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.315514252090379, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0020950130049756485}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.4272477194499663, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0031895534936824997}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.33692836067640447, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0027567274786219256}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.3556790279405754, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0023552583830999735}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed1/evaluation/generation/agg.4b284b84bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_2.json b/4b284b84bc4seed1/evaluation/generation/agg.4b284b84bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_2.json new file mode 100644 index 0000000000000000000000000000000000000000..ad8b1b2f239c88547407124fcf8f7932bd640a49 --- /dev/null +++ b/4b284b84bc4seed1/evaluation/generation/agg.4b284b84bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 12.752880813365183, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.22532887560628184}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.5483859178177682, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.003284509279619272}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4329119599793277, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002935675677350969}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.4576720641979181, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0022953942764252673}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.26853962452756747, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.002740945324943779}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.20828673845347298, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0021908686840527536}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.22030084182668652, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0020287670329249274}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.407475473407987, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0030181731331604795}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.31883364076878173, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002461630929460497}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.33784951726273604, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.002092067006211518}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.45802173612428515, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003228180984559956}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3606321592898537, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002748101165505275}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.38152814100163385, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002318898465385505}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed1/evaluation/generation/agg.4b284b84bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_3.json b/4b284b84bc4seed1/evaluation/generation/agg.4b284b84bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_3.json new file mode 100644 index 0000000000000000000000000000000000000000..9c8cf82ed497bf4e478241836a5f3cbf93cd5946 --- /dev/null +++ b/4b284b84bc4seed1/evaluation/generation/agg.4b284b84bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 13.567475379286549, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.1880502425341883}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.54296137339216, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0032385304204834925}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4468637477572891, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002870747282334814}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.46365491542004894, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0021794833674578123}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.268879550509031, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0026847549706603357}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.21872430008911764, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0022357966811142774}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.22644283092674808, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0020104468971516875}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.40563436021398125, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0029671089231426426}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.33158522150890407, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0024524778139217965}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.3445418845511442, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.002026802374084494}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.457618460997299, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003163617105952389}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.37651908361075154, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0027495326994019364}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.3905619856893357, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002253731478640236}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed1/evaluation/generation/agg.4b284b84bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_4.json b/4b284b84bc4seed1/evaluation/generation/agg.4b284b84bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_4.json new file mode 100644 index 0000000000000000000000000000000000000000..1f11d68b28a7c4c733f1f188c4bd9640d76a40d0 --- /dev/null +++ b/4b284b84bc4seed1/evaluation/generation/agg.4b284b84bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 13.740384950752064, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.17474565384186433}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.51943848236802, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0031779058467164764}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4567820792568219, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002851642014055284}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.4606344386510922, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0021643969739297475}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.25737502763838105, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0026242680468160895}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.2245153764885056, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0022588441708384973}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.22570040278921377, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0020088114026586526}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.3876917725288397, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0028653337007260647}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3397952534482862, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0024656674082997676}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.3427780842217158, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0020244481019983177}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.43916794242095064, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0030589422127270337}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3876015303869884, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0027798320723785553}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.3902532373292503, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0022482737601443}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed1/evaluation/generation/agg.4b284b84bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_5.json b/4b284b84bc4seed1/evaluation/generation/agg.4b284b84bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_5.json new file mode 100644 index 0000000000000000000000000000000000000000..ead2d2d5820671aedc873af8a55327406a20c425 --- /dev/null +++ b/4b284b84bc4seed1/evaluation/generation/agg.4b284b84bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 12.772366014464684, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.1727094167530513}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.4849957590476985, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0029633904151518614}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4698079682696499, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0028147920332754844}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.45315037221898985, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002063099268846445}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.23597412151168465, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0023313187461128483}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.22775944680052645, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002217444405292992}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.2186838500921512, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0018776056949733047}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.36121121776556825, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002645618381599165}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3483500842464673, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0024310911003668787}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.33617919401288165, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0019141754215681863}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.41312019009298706, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0028317325884933}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.40082494576214567, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0027213945607275796}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.3862609489154149, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0021169304456593015}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed1/evaluation/generation/agg.4b284b84bc4seed1_gem_xsum_article_DOC_summary_0.json b/4b284b84bc4seed1/evaluation/generation/agg.4b284b84bc4seed1_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..fea6af4e8680c6124cb4821f95e339ff7466d027 --- /dev/null +++ b/4b284b84bc4seed1/evaluation/generation/agg.4b284b84bc4seed1_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.1636017883690539, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0024265639944645607}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.3135411100199371, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004414059386580781}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.20406385886176096, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.00258155674612985}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.03326860572215188, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0013712483892843969}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.06935361806518704, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002630864064398201}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.042825803126534195, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.00160599002891498}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.12376190274002842, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0019110587602701528}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.23856624379837527, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0034515198934126907}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.154429756081877, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0019969002281278216}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.12670301550297952, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.001984240932547222}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.2456847137827434, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0037888888942200177}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.1585898458477123, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0021649602354550605}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.7916845418214005, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.07828212807526311}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed1/evaluation/generation/agg.4b284b84bc4seed1_gem_xsum_article_DOC_summary_1.json b/4b284b84bc4seed1/evaluation/generation/agg.4b284b84bc4seed1_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..b2402a98e09f3980c1634e4bd6058c50326119fb --- /dev/null +++ b/4b284b84bc4seed1/evaluation/generation/agg.4b284b84bc4seed1_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.12258398799437052, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0017962630199380857}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.3012382161995991, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004139509463692997}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.17216405786002645, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002413004919727933}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.022923096739945113, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0009396939072749053}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.058554066932389494, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002474769338098033}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.032550109418001044, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0013323022688404391}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.0953766892949565, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0013021773787458971}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.2362381442835074, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0031828562476237457}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.13422605654232356, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0017698404507476406}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.09729740585688308, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.001433871342903216}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.24153880156299268, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.003500903202746728}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.13702592659449045, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0019551406042742046}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.3135114346532981, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.08463533356367237}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed1/evaluation/generation/agg.4b284b84bc4seed1_gem_xsum_article_DOC_summary_2.json b/4b284b84bc4seed1/evaluation/generation/agg.4b284b84bc4seed1_gem_xsum_article_DOC_summary_2.json new file mode 100644 index 0000000000000000000000000000000000000000..83acaba8e5231ce8362c58b1b5b1b8b0e7949d59 --- /dev/null +++ b/4b284b84bc4seed1/evaluation/generation/agg.4b284b84bc4seed1_gem_xsum_article_DOC_summary_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.12014057910525737, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.00177027208032182}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.2937362802990173, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0040558921767481415}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.16848679088873222, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0023805185438281235}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.023037471663706975, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0009651714294322547}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.05808812201139429, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002494816691771811}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.032592328628319726, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001360334296634944}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.09796298255577943, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0013818612760360376}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.24059048844697575, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0032525841201501613}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.13752060575301803, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0018652017270717643}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.09437688045356053, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0014232755198755626}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.23332253770052824, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0034512361504183474}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.13274693169694082, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0019432835336852861}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.2969951394913493, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.06867031320524596}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed1/evaluation/generation/agg.4b284b84bc4seed1_gem_xsum_article_DOC_summary_3.json b/4b284b84bc4seed1/evaluation/generation/agg.4b284b84bc4seed1_gem_xsum_article_DOC_summary_3.json new file mode 100644 index 0000000000000000000000000000000000000000..ad2dfe5736cef6c33724aefa5b0c3834b92e69f1 --- /dev/null +++ b/4b284b84bc4seed1/evaluation/generation/agg.4b284b84bc4seed1_gem_xsum_article_DOC_summary_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.11962719565205662, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002016131135992487}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.2790081357700044, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0043060099015184835}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.16364844726335212, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002540088417740363}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.02385360834922912, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.000982041326291719}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.057563110969334454, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002474970323879015}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.03286054820200277, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0013434565504320645}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.09886948142069724, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0016489525812605937}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.23196290924579455, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.003657598924470169}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.13539724940510672, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0020807935996877674}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.09403709487175377, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0016315538581778424}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.22096634372218205, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0036039318241550657}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.12875250329964805, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0020505398481043147}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.327235232469952, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.09959209280385814}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed1/evaluation/generation/agg.4b284b84bc4seed1_gem_xsum_article_DOC_summary_4.json b/4b284b84bc4seed1/evaluation/generation/agg.4b284b84bc4seed1_gem_xsum_article_DOC_summary_4.json new file mode 100644 index 0000000000000000000000000000000000000000..21e3115348c80d3b02a82597909fbd54e381e629 --- /dev/null +++ b/4b284b84bc4seed1/evaluation/generation/agg.4b284b84bc4seed1_gem_xsum_article_DOC_summary_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.04098939178475802, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0026204420208068035}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.07322660875950299, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0042459458791253716}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.04714699127177818, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002660932299544834}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.009005101634115067, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.00121171937903932}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.016152720952389045, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0015904264999107502}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.01002600655383815, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0009249273635939417}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.034375344099908396, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002283572080585189}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.06037717457617166, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0035163081114451514}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.038851245646855916, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.002177065038104623}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.03382829886719806, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.002342085999586738}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.05845333975676655, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.003459845391454891}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.03782418886463528, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0021755326176048475}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 0.720494287805737, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.13337005008364483}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed1/evaluation/generation/agg.4b284b84bc4seed1_gem_xsum_article_DOC_summary_5.json b/4b284b84bc4seed1/evaluation/generation/agg.4b284b84bc4seed1_gem_xsum_article_DOC_summary_5.json new file mode 100644 index 0000000000000000000000000000000000000000..e757f83abe2727a8a630d3a73b9938edbb072986 --- /dev/null +++ b/4b284b84bc4seed1/evaluation/generation/agg.4b284b84bc4seed1_gem_xsum_article_DOC_summary_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.0027818328091416475, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0007401612256325405}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.002330798812107932, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0006256804823539565}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.002482537431673434, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0006590331629581881}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.0003101211896994361, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.00012661794961734148}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.0002680102915951972, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.00011124280815470673}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.00028593668938742907, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.00011751104642033578}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.0020462530294442205, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0005534615847200946}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.0017580325391528475, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0004906057300283716}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.001846067784976754, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0005022326643801285}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.0025260844263122434, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0006786126789253857}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.002133328291896597, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.000585991073578324}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.002260942501090202, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0006097815513991564}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.437491909962072e-37, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 6.679183284996885e-31}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_GEM-web_nlg_en_PALM_prompt_0.jsonl b/4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_GEM-web_nlg_en_PALM_prompt_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..5a16ba0b7351a6777af53392bfa912f40730d8c9 --- /dev/null +++ b/4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_GEM-web_nlg_en_PALM_prompt_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99edb5e425657b632e5da2c7d32afdd5cf707893ff589988d24c7cefe6d90bcf +size 4125601 diff --git a/4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_GEM-web_nlg_en_PALM_prompt_1.jsonl b/4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_GEM-web_nlg_en_PALM_prompt_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e166eee20d0316935b75a119a6e61937e74de71d --- /dev/null +++ b/4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_GEM-web_nlg_en_PALM_prompt_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ff72ebec179bdf6d382a18dd1de30ce0761e926f4488b1ed3aecee26b42426e +size 5100585 diff --git a/4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_GEM-web_nlg_en_PALM_prompt_2.jsonl b/4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_GEM-web_nlg_en_PALM_prompt_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..87503e7cf3fbe4ddd976330a03333aaf766f000d --- /dev/null +++ b/4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_GEM-web_nlg_en_PALM_prompt_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4920687f3d1bb673d3f6efc31075af23baec0729aa6a78b573e06ff00e54dd94 +size 6015964 diff --git a/4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_GEM-web_nlg_en_PALM_prompt_3.jsonl b/4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_GEM-web_nlg_en_PALM_prompt_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..bd6af78d506694fd475b014e61bd156adb794a4a --- /dev/null +++ b/4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_GEM-web_nlg_en_PALM_prompt_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee7f6f6e548f7ea6598e9df3f6b316eddaa83ecd5e98fca241b65d3a1c6e8174 +size 6943636 diff --git a/4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_GEM-web_nlg_en_PALM_prompt_4.jsonl b/4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_GEM-web_nlg_en_PALM_prompt_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..db4e957bbd7bf2c7fdd789c8a04c5be25c5ee91e --- /dev/null +++ b/4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_GEM-web_nlg_en_PALM_prompt_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44d8eed75b01a4e073859112df0d89d520b2670a3205d24f8fa49b8043819cda +size 7852923 diff --git a/4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_GEM-web_nlg_en_PALM_prompt_5.jsonl b/4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_GEM-web_nlg_en_PALM_prompt_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..5b749e5d6224766452c8ab93b8885b32b9b1447c --- /dev/null +++ b/4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_GEM-web_nlg_en_PALM_prompt_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62334751617972b1b9637d7000b2a64af567c3d78dc88de106d71d57ba32259d +size 8766721 diff --git a/4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_GEM-wiki_lingua_en_tldr_en_0.jsonl b/4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_GEM-wiki_lingua_en_tldr_en_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..5d925b30c5c2da759bd207ab82056ecb4344e82e --- /dev/null +++ b/4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_GEM-wiki_lingua_en_tldr_en_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed17e6663e67826f88690fde941a158e62e0ad4b3f27fe2cdbe615bcc74e89f8 +size 7677561 diff --git a/4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_GEM-wiki_lingua_en_tldr_en_1.jsonl b/4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_GEM-wiki_lingua_en_tldr_en_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..41dabc43b5460e50960e9866d86ec814ead285c0 --- /dev/null +++ b/4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_GEM-wiki_lingua_en_tldr_en_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c212a086900c27d8dca4c5262bfbd47aa52809470b1452e7e18e7d553d8c7eef +size 13319402 diff --git a/4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_GEM-wiki_lingua_en_tldr_en_2.jsonl b/4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_GEM-wiki_lingua_en_tldr_en_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..52e23f0ff1afa1426629daa88a525e83b6f2473b --- /dev/null +++ b/4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_GEM-wiki_lingua_en_tldr_en_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f96b86323763ad7f24f8db81dde0b3fd117a9d86123eb2a10d70fd56b64ed763 +size 18911611 diff --git a/4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_GEM-wiki_lingua_en_tldr_en_3.jsonl b/4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_GEM-wiki_lingua_en_tldr_en_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..1c2ef2bc7056d33f16aac686c120adbca8cf6742 --- /dev/null +++ b/4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_GEM-wiki_lingua_en_tldr_en_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c91d5946a148cdc2309d44e9c7d934d5efdc136022c90b741b9fb47cc9409c7f +size 24330373 diff --git a/4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_GEM-wiki_lingua_en_tldr_en_4.jsonl b/4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_GEM-wiki_lingua_en_tldr_en_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e8b29e6a4be061d211eabdf75930ede8d36fcfe4 --- /dev/null +++ b/4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_GEM-wiki_lingua_en_tldr_en_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:661e4befc115f0ae1284e84e85bc17ac685a7b9bc2b13aa21cccbe4a01791cce +size 29472600 diff --git a/4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_GEM-wiki_lingua_en_tldr_en_5.jsonl b/4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_GEM-wiki_lingua_en_tldr_en_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..d7a134d7ef017ef4826425734e0f5ffefc8b1a64 --- /dev/null +++ b/4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_GEM-wiki_lingua_en_tldr_en_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b813e22c15bf0f5f125dc233aae07c1a150e12cccddf7414e0fbfde2b7786cd +size 34799981 diff --git a/4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl b/4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..11c7a69e58c370f588652a3fe089e147c258fdfb --- /dev/null +++ b/4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:accfd1ac193f56e691948b0a55c1d228c53d5d90c92d11aea65a0a4d4938c5f0 +size 4503280 diff --git a/4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl b/4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..20618aef8cea5f71f6a1c4afb552fdf73352f3db --- /dev/null +++ b/4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce2f4a75463db4eeb1553a38ad6da60eec4768c814ccb1b3773a9226dbb0d27d +size 5029610 diff --git a/4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl b/4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..41609116a0de072096d47b57016a065a74d0cf39 --- /dev/null +++ b/4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44084d17dcb56f22954ad5b1eb7adcbf8854947d17893349c954e2694920ea2e +size 6113880 diff --git a/4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl b/4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..364b71067430e753575ab6062007eb18f9f0e1b1 --- /dev/null +++ b/4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cace0772644520668a4a48455f5039ba7b733e60286b4b5ed97e75b4403ac0b0 +size 7213616 diff --git a/4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl b/4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..513d2bf380a12b262c4ef770ae787dbb36df6d87 --- /dev/null +++ b/4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38bd7d8c5227c9d898849736d3027a36e178a8c88543f671919e6d83e1e83a7e +size 8319346 diff --git a/4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl b/4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..6f4755bb443534a528fe895088244ccf788f1762 --- /dev/null +++ b/4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:561c4226b02ea7c525bcb7620defe409113a1fa0d4eefe73b2ae75df4b2db523 +size 9446609 diff --git a/4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_gem_xsum_article_DOC_summary_0.jsonl b/4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_gem_xsum_article_DOC_summary_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..ba741bf9143b960e0a446d2d7d4ff1ef5d7cd117 --- /dev/null +++ b/4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_gem_xsum_article_DOC_summary_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd241c8c157d77579e040fb4c4f00fbfe179d620cc0704b9e1fea0d915bca2a2 +size 2783414 diff --git a/4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_gem_xsum_article_DOC_summary_1.jsonl b/4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_gem_xsum_article_DOC_summary_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..46d2301144d77d316cdc3d40cf4ec42c99d2acff --- /dev/null +++ b/4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_gem_xsum_article_DOC_summary_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:600c083ddd8c7fa75a53741c1f8eefb41e5d0e461e45ae563a79b254ff179607 +size 5103114 diff --git a/4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_gem_xsum_article_DOC_summary_2.jsonl b/4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_gem_xsum_article_DOC_summary_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..8b8fd9367bf9952523137cb58259a2f3d4a661e4 --- /dev/null +++ b/4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_gem_xsum_article_DOC_summary_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe164d8c6f44ee56ba05adf8d1d8888f0bf6546ee5ff4b96b06ed822a8bba6ef +size 7378005 diff --git a/4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_gem_xsum_article_DOC_summary_3.jsonl b/4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_gem_xsum_article_DOC_summary_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..bb61c7f8bc3255b7c7e0a0ab1b676f26f1b73ba7 --- /dev/null +++ b/4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_gem_xsum_article_DOC_summary_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f2c67451b761421f27bb6691de6ba91b44c4ab5f1aa25cd1bf96c5a5801b83e +size 9645216 diff --git a/4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_gem_xsum_article_DOC_summary_4.jsonl b/4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_gem_xsum_article_DOC_summary_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..95733773d61399911802d1f50ba278846dec8d91 --- /dev/null +++ b/4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_gem_xsum_article_DOC_summary_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f98fda765bc56873b45400d8ade210dbb95f4a0a1aea15f200062ca94f0a6cc4 +size 11671985 diff --git a/4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_gem_xsum_article_DOC_summary_5.jsonl b/4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_gem_xsum_article_DOC_summary_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..7eed0466967070a07d404bfdcff5d67e3cb633d4 --- /dev/null +++ b/4b284b84bc4seed1/evaluation/generation/examples.4b284b84bc4seed1_gem_xsum_article_DOC_summary_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:378d7c4028216a73012e77c351e79ff1cbdfc417b6ffe16d006b62914137581d +size 13897469 diff --git a/4b284b84bc4seed1/evaluation/generation/merged.csv b/4b284b84bc4seed1/evaluation/generation/merged.csv new file mode 100644 index 0000000000000000000000000000000000000000..d3822863ba32a4badb24bb79c4ca8522adf879c7 --- /dev/null +++ b/4b284b84bc4seed1/evaluation/generation/merged.csv @@ -0,0 +1,53 @@ +dataset,fewshots,prompt,metric,value +e2e_nlg_cleaned,0,generate_text_restaurant,rouge2_fmeasure,0.00022602188070215841 +e2e_nlg_cleaned,0,median,rouge2_fmeasure,0.00022602188070215841 +e2e_nlg_cleaned,1,generate_text_restaurant,rouge2_fmeasure,0.1983453767330724 +e2e_nlg_cleaned,1,median,rouge2_fmeasure,0.1983453767330724 +e2e_nlg_cleaned,2,generate_text_restaurant,rouge2_fmeasure,0.22030084182668652 +e2e_nlg_cleaned,2,median,rouge2_fmeasure,0.22030084182668652 +e2e_nlg_cleaned,3,generate_text_restaurant,rouge2_fmeasure,0.22644283092674808 +e2e_nlg_cleaned,3,median,rouge2_fmeasure,0.22644283092674808 +e2e_nlg_cleaned,4,generate_text_restaurant,rouge2_fmeasure,0.22570040278921377 +e2e_nlg_cleaned,4,median,rouge2_fmeasure,0.22570040278921377 +e2e_nlg_cleaned,5,generate_text_restaurant,rouge2_fmeasure,0.2186838500921512 +e2e_nlg_cleaned,5,median,rouge2_fmeasure,0.2186838500921512 +e2e_nlg_cleaned,5,average,multiple,0.181616554041429 +gem_xsum,0,article_DOC_summary,rouge2_fmeasure,0.042825803126534195 +gem_xsum,0,median,rouge2_fmeasure,0.042825803126534195 +gem_xsum,1,article_DOC_summary,rouge2_fmeasure,0.032550109418001044 +gem_xsum,1,median,rouge2_fmeasure,0.032550109418001044 +gem_xsum,2,article_DOC_summary,rouge2_fmeasure,0.032592328628319726 +gem_xsum,2,median,rouge2_fmeasure,0.032592328628319726 +gem_xsum,3,article_DOC_summary,rouge2_fmeasure,0.03286054820200277 +gem_xsum,3,median,rouge2_fmeasure,0.03286054820200277 +gem_xsum,4,article_DOC_summary,rouge2_fmeasure,0.01002600655383815 +gem_xsum,4,median,rouge2_fmeasure,0.01002600655383815 +gem_xsum,5,article_DOC_summary,rouge2_fmeasure,0.00028593668938742907 +gem_xsum,5,median,rouge2_fmeasure,0.00028593668938742907 +gem_xsum,5,average,multiple,0.025190122103013884 +web_nlg_en,0,PALM_prompt,rouge2_fmeasure,0.05411413548524944 +web_nlg_en,0,median,rouge2_fmeasure,0.05411413548524944 +web_nlg_en,1,PALM_prompt,rouge2_fmeasure,0.06096091447803779 +web_nlg_en,1,median,rouge2_fmeasure,0.06096091447803779 +web_nlg_en,2,PALM_prompt,rouge2_fmeasure,0.06253675704279393 +web_nlg_en,2,median,rouge2_fmeasure,0.06253675704279393 +web_nlg_en,3,PALM_prompt,rouge2_fmeasure,0.06437212669435428 +web_nlg_en,3,median,rouge2_fmeasure,0.06437212669435428 +web_nlg_en,4,PALM_prompt,rouge2_fmeasure,0.06331896436631664 +web_nlg_en,4,median,rouge2_fmeasure,0.06331896436631664 +web_nlg_en,5,PALM_prompt,rouge2_fmeasure,0.06552803780701107 +web_nlg_en,5,median,rouge2_fmeasure,0.06552803780701107 +web_nlg_en,5,average,multiple,0.061805155978960524 +wiki_lingua_en,0,tldr_en,rouge2_fmeasure,0.03235069293218825 +wiki_lingua_en,0,median,rouge2_fmeasure,0.03235069293218825 +wiki_lingua_en,1,tldr_en,rouge2_fmeasure,0.05436564304591471 +wiki_lingua_en,1,median,rouge2_fmeasure,0.05436564304591471 +wiki_lingua_en,2,tldr_en,rouge2_fmeasure,0.05407980043809886 +wiki_lingua_en,2,median,rouge2_fmeasure,0.05407980043809886 +wiki_lingua_en,3,tldr_en,rouge2_fmeasure,0.04429422701774445 +wiki_lingua_en,3,median,rouge2_fmeasure,0.04429422701774445 +wiki_lingua_en,4,tldr_en,rouge2_fmeasure,0.014128667931700438 +wiki_lingua_en,4,median,rouge2_fmeasure,0.014128667931700438 +wiki_lingua_en,5,tldr_en,rouge2_fmeasure,0.0024954950292378434 +wiki_lingua_en,5,median,rouge2_fmeasure,0.0024954950292378434 +wiki_lingua_en,5,average,multiple,0.033619087732480755 diff --git a/4b284b84bc4seed1/evaluation/generation/merged.json b/4b284b84bc4seed1/evaluation/generation/merged.json new file mode 100644 index 0000000000000000000000000000000000000000..fb2c308fbdfdc83b2101df344edeeb0fbdb45815 --- /dev/null +++ b/4b284b84bc4seed1/evaluation/generation/merged.json @@ -0,0 +1 @@ +{"GEM/web_nlg_en": {"0": {"PALM_prompt": {"bleu": 0.4177738397053596, "bleu_stderr": 0.052439714987504826, "rouge1_fmeasure": 0.11313553204694117, "rouge1_fmeasure_stderr": 0.0020976821294602234, "rouge1_precision": 0.07401331365029154, "rouge1_precision_stderr": 0.001555945380008501, "rouge1_recall": 0.309544677126812, "rouge1_recall_stderr": 0.004598258018956965, "rouge2_fmeasure": 0.05411413548524944, "rouge2_fmeasure_stderr": 0.0013020734544028827, "rouge2_precision": 0.03523505191827857, "rouge2_precision_stderr": 0.0009392296781654515, "rouge2_recall": 0.15329454407408277, "rouge2_recall_stderr": 0.003251728201432321, "rougeL_fmeasure": 0.10845705136602556, "rougeL_fmeasure_stderr": 0.0019284471387199143, "rougeL_precision": 0.07061132409656197, "rougeL_precision_stderr": 0.0014031957668770357, "rougeL_recall": 0.30042353738636374, "rougeL_recall_stderr": 0.0044778245769371994, "rougeLsum_fmeasure": 0.10792394253569278, "rougeLsum_fmeasure_stderr": 0.0019640770726289487, "rougeLsum_precision": 0.07049851230067716, "rougeLsum_precision_stderr": 0.001450359178267902, "rougeLsum_recall": 0.296810156480222, "rougeLsum_recall_stderr": 0.0043631335921961835}}, "1": {"PALM_prompt": {"bleu": 0.5808615724978651, "bleu_stderr": 0.03393350967485746, "rouge1_fmeasure": 0.12727475120836446, "rouge1_fmeasure_stderr": 0.002035424606741712, "rouge1_precision": 0.08183691647303251, "rouge1_precision_stderr": 0.0015166625147494993, "rouge1_recall": 0.40093348191479217, "rouge1_recall_stderr": 0.005450906036616762, "rouge2_fmeasure": 0.06096091447803779, "rouge2_fmeasure_stderr": 0.0012946551599852026, "rouge2_precision": 0.039062153239498784, "rouge2_precision_stderr": 0.0009349863984338872, "rouge2_recall": 0.20112348772170943, "rouge2_recall_stderr": 0.003804920107675235, "rougeL_fmeasure": 0.1192836731407637, "rougeL_fmeasure_stderr": 0.001834016996545526, "rougeL_precision": 0.07650521343895433, "rougeL_precision_stderr": 0.0013445352921906551, "rougeL_recall": 0.37517446453693076, "rougeL_recall_stderr": 0.004982125783681737, "rougeLsum_fmeasure": 0.12012804167712486, "rougeLsum_fmeasure_stderr": 0.0018942369664582516, "rougeLsum_precision": 0.07726225443418276, "rougeLsum_precision_stderr": 0.001411238354454551, "rougeLsum_recall": 0.3769882191273612, "rougeLsum_recall_stderr": 0.004973103856227287}}, "2": {"PALM_prompt": {"bleu": 0.6974388179157304, "bleu_stderr": 0.030575587628070142, "rouge1_fmeasure": 0.13158075248220336, "rouge1_fmeasure_stderr": 0.0019778747548532725, "rouge1_precision": 0.08378329306693072, "rouge1_precision_stderr": 0.001459322065449314, "rouge1_recall": 0.4295176674907729, "rouge1_recall_stderr": 0.005387840357836537, "rouge2_fmeasure": 0.06253675704279393, "rouge2_fmeasure_stderr": 0.0012350283375229683, "rouge2_precision": 0.03959861804048329, "rouge2_precision_stderr": 0.0008790815089921375, "rouge2_recall": 0.21857768529907604, "rouge2_recall_stderr": 0.003978406350005915, "rougeL_fmeasure": 0.12041670906511595, "rougeL_fmeasure_stderr": 0.001724997794417473, "rougeL_precision": 0.0765488634109198, "rougeL_precision_stderr": 0.001262760988042247, "rougeL_recall": 0.3942968542813885, "rougeL_recall_stderr": 0.004825967992749896, "rougeLsum_fmeasure": 0.12422716343042028, "rougeLsum_fmeasure_stderr": 0.0018397851260800163, "rougeLsum_precision": 0.07912745617089588, "rougeLsum_precision_stderr": 0.0013596543752117662, "rougeLsum_recall": 0.40482037642139057, "rougeLsum_recall_stderr": 0.004938559564217245}}, "3": {"PALM_prompt": {"bleu": 0.8278535585588646, "bleu_stderr": 0.04101323263962433, "rouge1_fmeasure": 0.13488847581723404, "rouge1_fmeasure_stderr": 0.0019541441973022983, "rouge1_precision": 0.08547615960283327, "rouge1_precision_stderr": 0.0014631064392462048, "rouge1_recall": 0.45233724476476256, "rouge1_recall_stderr": 0.005498610961440376, "rouge2_fmeasure": 0.06437212669435428, "rouge2_fmeasure_stderr": 0.0012436500824994457, "rouge2_precision": 0.04064020009202515, "rouge2_precision_stderr": 0.0009117668832831653, "rouge2_recall": 0.23147273606302815, "rouge2_recall_stderr": 0.004055355768121839, "rougeL_fmeasure": 0.12265416975642841, "rougeL_fmeasure_stderr": 0.001687981425852585, "rougeL_precision": 0.07766706751152817, "rougeL_precision_stderr": 0.0012705151561288445, "rougeL_recall": 0.4116826372221156, "rougeL_recall_stderr": 0.004846073095478439, "rougeLsum_fmeasure": 0.12722726363829323, "rougeLsum_fmeasure_stderr": 0.0018316120685934315, "rougeLsum_precision": 0.08067112264899551, "rougeLsum_precision_stderr": 0.0013779713860748017, "rougeLsum_recall": 0.42508315288079185, "rougeLsum_recall_stderr": 0.005020947504999342}}, "4": {"PALM_prompt": {"bleu": 0.8696996582752973, "bleu_stderr": 0.06098328946071962, "rouge1_fmeasure": 0.1345378611428427, "rouge1_fmeasure_stderr": 0.0019444813188940376, "rouge1_precision": 0.0846654378867452, "rouge1_precision_stderr": 0.0014210010721050707, "rouge1_recall": 0.4578457479151435, "rouge1_recall_stderr": 0.005514991901446975, "rouge2_fmeasure": 0.06331896436631664, "rouge2_fmeasure_stderr": 0.0012304846406140408, "rouge2_precision": 0.03959585063348627, "rouge2_precision_stderr": 0.000862580003329711, "rouge2_recall": 0.2318178313336565, "rouge2_recall_stderr": 0.0041148040681156135, "rougeL_fmeasure": 0.1206116472621873, "rougeL_fmeasure_stderr": 0.001620078997028922, "rougeL_precision": 0.07578970344610945, "rougeL_precision_stderr": 0.0011783081782238954, "rougeL_recall": 0.4122041018783002, "rougeL_recall_stderr": 0.004808418678515961, "rougeLsum_fmeasure": 0.12652519308473198, "rougeLsum_fmeasure_stderr": 0.0018015979293605463, "rougeLsum_precision": 0.0796291662268957, "rougeLsum_precision_stderr": 0.001316435535538898, "rougeLsum_recall": 0.43058423280412716, "rougeLsum_recall_stderr": 0.005076088365482536}}, "5": {"PALM_prompt": {"bleu": 0.9386565201757037, "bleu_stderr": 0.044526839780327905, "rouge1_fmeasure": 0.13836362229996832, "rouge1_fmeasure_stderr": 0.001893431540140422, "rouge1_precision": 0.08665394421115923, "rouge1_precision_stderr": 0.0013765101453522592, "rouge1_recall": 0.479351769718965, "rouge1_recall_stderr": 0.00548474489542107, "rouge2_fmeasure": 0.06552803780701107, "rouge2_fmeasure_stderr": 0.001201220687887674, "rouge2_precision": 0.04073112194630253, "rouge2_precision_stderr": 0.0008342579281972372, "rouge2_recall": 0.24709583361079115, "rouge2_recall_stderr": 0.004288275564287053, "rougeL_fmeasure": 0.12284158062218388, "rougeL_fmeasure_stderr": 0.0015900050300239478, "rougeL_precision": 0.07688627300671028, "rougeL_precision_stderr": 0.0011617752110929672, "rougeL_recall": 0.4288123063878505, "rougeL_recall_stderr": 0.004826731215989172, "rougeLsum_fmeasure": 0.1301416572009741, "rougeLsum_fmeasure_stderr": 0.001768541697398853, "rougeLsum_precision": 0.08154653189712766, "rougeLsum_precision_stderr": 0.001288193874235195, "rougeLsum_recall": 0.4505990363238062, "rougeLsum_recall_stderr": 0.005059301966187745}}}, "GEM/wiki_lingua_en": {"0": {"tldr_en": {"bleu": 1.4010466021962698, "bleu_stderr": 0.05693469656785709, "rouge1_fmeasure": 0.16422245329729376, "rouge1_fmeasure_stderr": 0.0018151110735496203, "rouge1_precision": 0.13997262682188616, "rouge1_precision_stderr": 0.0018152662704601968, "rouge1_recall": 0.23988301526777517, "rouge1_recall_stderr": 0.0026425508349757127, "rouge2_fmeasure": 0.03235069293218825, "rouge2_fmeasure_stderr": 0.0008205093824111827, "rouge2_precision": 0.02739555088551612, "rouge2_precision_stderr": 0.0007299475693711506, "rouge2_recall": 0.04882561093577656, "rouge2_recall_stderr": 0.0013519389814047277, "rougeL_fmeasure": 0.1298012454573935, "rougeL_fmeasure_stderr": 0.0013082389095494423, "rougeL_precision": 0.10940153468767774, "rougeL_precision_stderr": 0.0012797812738055785, "rougeL_recall": 0.19392296248486443, "rougeL_recall_stderr": 0.0021299443087579575, "rougeLsum_fmeasure": 0.15178310664024564, "rougeLsum_fmeasure_stderr": 0.0016581127885119964, "rougeLsum_precision": 0.12920003480420952, "rougeLsum_precision_stderr": 0.0016583776510762952, "rougeLsum_recall": 0.22237769560119033, "rougeLsum_recall_stderr": 0.002445338658648684}}, "1": {"tldr_en": {"bleu": 2.6792767534985105, "bleu_stderr": 0.08050348994884776, "rouge1_fmeasure": 0.22176158764199283, "rouge1_fmeasure_stderr": 0.0019496812102440851, "rouge1_precision": 0.19237806407108246, "rouge1_precision_stderr": 0.002156616087328965, "rouge1_recall": 0.3212993636930355, "rouge1_recall_stderr": 0.002829724921518021, "rouge2_fmeasure": 0.05436564304591471, "rouge2_fmeasure_stderr": 0.0010398581680374484, "rouge2_precision": 0.04730550033705585, "rouge2_precision_stderr": 0.0010038562816699207, "rouge2_recall": 0.0810126790953652, "rouge2_recall_stderr": 0.0016920263323925329, "rougeL_fmeasure": 0.15298606072602197, "rougeL_fmeasure_stderr": 0.001269522698605816, "rougeL_precision": 0.13189452873558555, "rougeL_precision_stderr": 0.0014440357444886517, "rougeL_recall": 0.22728266255319154, "rougeL_recall_stderr": 0.0021740082956540176, "rougeLsum_fmeasure": 0.20773701812397452, "rougeLsum_fmeasure_stderr": 0.0018267476451028011, "rougeLsum_precision": 0.1799760146194542, "rougeLsum_precision_stderr": 0.002013284357082607, "rougeLsum_recall": 0.3015175800896575, "rougeLsum_recall_stderr": 0.0026743484362997554}}, "2": {"tldr_en": {"bleu": 2.825588151177289, "bleu_stderr": 0.0827483173505062, "rouge1_fmeasure": 0.21881031202295378, "rouge1_fmeasure_stderr": 0.0018340980892655135, "rouge1_precision": 0.19587403318777896, "rouge1_precision_stderr": 0.002246482935330373, "rouge1_recall": 0.3104623013424553, "rouge1_recall_stderr": 0.0026357716525505985, "rouge2_fmeasure": 0.05407980043809886, "rouge2_fmeasure_stderr": 0.0010322675581464652, "rouge2_precision": 0.049518456494770303, "rouge2_precision_stderr": 0.001177357025652893, "rouge2_recall": 0.07843155253080596, "rouge2_recall_stderr": 0.0016707411483431178, "rougeL_fmeasure": 0.15447333837028793, "rougeL_fmeasure_stderr": 0.0012811266282334365, "rougeL_precision": 0.13795120173138903, "rougeL_precision_stderr": 0.001669101235947338, "rougeL_recall": 0.22381109650316425, "rougeL_recall_stderr": 0.002115149596829255, "rougeLsum_fmeasure": 0.20577620783096848, "rougeLsum_fmeasure_stderr": 0.0017206650892505897, "rougeLsum_precision": 0.18399939129198817, "rougeLsum_precision_stderr": 0.0021107295487964614, "rougeLsum_recall": 0.2924275031032992, "rougeLsum_recall_stderr": 0.0024986416120394883}}, "3": {"tldr_en": {"bleu": 2.77140298721746, "bleu_stderr": 0.09911601058676267, "rouge1_fmeasure": 0.17955806504481292, "rouge1_fmeasure_stderr": 0.002195205258030929, "rouge1_precision": 0.1647227013547415, "rouge1_precision_stderr": 0.0024792520261390483, "rouge1_recall": 0.2560613183847905, "rouge1_recall_stderr": 0.0032797831033041618, "rouge2_fmeasure": 0.04429422701774445, "rouge2_fmeasure_stderr": 0.0010178187766663955, "rouge2_precision": 0.040393011250336536, "rouge2_precision_stderr": 0.001120492765195676, "rouge2_recall": 0.06579426072456108, "rouge2_recall_stderr": 0.001694481658818446, "rougeL_fmeasure": 0.12746828061030624, "rougeL_fmeasure_stderr": 0.0015396980890683188, "rougeL_precision": 0.11737676404806478, "rougeL_precision_stderr": 0.0018604626033532456, "rougeL_recall": 0.1856490443924171, "rougeL_recall_stderr": 0.00253379229574718, "rougeLsum_fmeasure": 0.1689495507422565, "rougeLsum_fmeasure_stderr": 0.0020580481966186253, "rougeLsum_precision": 0.15523651118051682, "rougeLsum_precision_stderr": 0.0023598380194680005, "rougeLsum_recall": 0.24112578036228802, "rougeLsum_recall_stderr": 0.0030888339817801563}}, "4": {"tldr_en": {"bleu": 0.6374428010243339, "bleu_stderr": 0.04679817619985886, "rouge1_fmeasure": 0.05724507901787019, "rouge1_fmeasure_stderr": 0.001923136290184156, "rouge1_precision": 0.053177399565422716, "rouge1_precision_stderr": 0.001969539589668854, "rouge1_recall": 0.08460445332976693, "rouge1_recall_stderr": 0.002887654568198146, "rouge2_fmeasure": 0.014128667931700438, "rouge2_fmeasure_stderr": 0.0006962023161566057, "rouge2_precision": 0.012859547969705542, "rouge2_precision_stderr": 0.000726325510216138, "rouge2_recall": 0.02237244864266085, "rouge2_recall_stderr": 0.0012034662851936587, "rougeL_fmeasure": 0.042868526761057124, "rougeL_fmeasure_stderr": 0.0014217476738280137, "rougeL_precision": 0.03993285011532237, "rougeL_precision_stderr": 0.0014928569276828109, "rougeL_recall": 0.06466228514995502, "rougeL_recall_stderr": 0.0022622950372018576, "rougeLsum_fmeasure": 0.053934021939145045, "rougeLsum_fmeasure_stderr": 0.0018135115805431904, "rougeLsum_precision": 0.05008717864701033, "rougeLsum_precision_stderr": 0.0018614454895917413, "rougeLsum_recall": 0.07995227312474681, "rougeLsum_recall_stderr": 0.0027408841913450226}}, "5": {"tldr_en": {"bleu": 1.5497714003816197e-06, "bleu_stderr": 2.826544891292017e-06, "rouge1_fmeasure": 0.009409482800898775, "rouge1_fmeasure_stderr": 0.0008719922868900455, "rouge1_precision": 0.009250162353650573, "rouge1_precision_stderr": 0.0009501892043502089, "rouge1_recall": 0.01399225543923628, "rouge1_recall_stderr": 0.0013479443593293063, "rouge2_fmeasure": 0.0024954950292378434, "rouge2_fmeasure_stderr": 0.00030758521273803235, "rouge2_precision": 0.0025132950634529213, "rouge2_precision_stderr": 0.0003496566473256293, "rouge2_recall": 0.003986174570934941, "rouge2_recall_stderr": 0.0005228969007076435, "rougeL_fmeasure": 0.007016931130854418, "rougeL_fmeasure_stderr": 0.0006474630715093982, "rougeL_precision": 0.006939530851512524, "rougeL_precision_stderr": 0.000721287497804254, "rougeL_recall": 0.010674568197211812, "rougeL_recall_stderr": 0.0010578455964358668, "rougeLsum_fmeasure": 0.008928183444317063, "rougeLsum_fmeasure_stderr": 0.0008250504967685091, "rougeLsum_precision": 0.008770387592628782, "rougeLsum_precision_stderr": 0.0008958471929010777, "rougeLsum_recall": 0.013287426441297979, "rougeLsum_recall_stderr": 0.0012768296011753365}}}, "e2e_nlg_cleaned": {"0": {"generate_text_restaurant": {"bleu": 0.01707387064925112, "bleu_stderr": 0.004548339499332125, "rouge1_fmeasure": 0.01833385014011665, "rouge1_fmeasure_stderr": 0.0004556651351480112, "rouge1_precision": 0.01479209987025161, "rouge1_precision_stderr": 0.0003848187529004132, "rouge1_recall": 0.02647907855108807, "rouge1_recall_stderr": 0.0007373776368265799, "rouge2_fmeasure": 0.00022602188070215841, "rouge2_fmeasure_stderr": 4.551736869387828e-05, "rouge2_precision": 0.00018468533574224637, "rouge2_precision_stderr": 3.7035782299895355e-05, "rouge2_recall": 0.00032184358555587336, "rouge2_recall_stderr": 6.80865158511292e-05, "rougeL_fmeasure": 0.01828543709345876, "rougeL_fmeasure_stderr": 0.000449785707890762, "rougeL_precision": 0.014749675627827365, "rougeL_precision_stderr": 0.0003794521861304636, "rougeL_recall": 0.02642067669572227, "rougeL_recall_stderr": 0.0007319703340695989, "rougeLsum_fmeasure": 0.017042834318925764, "rougeLsum_fmeasure_stderr": 0.00038117023392555423, "rougeLsum_precision": 0.01381746395527955, "rougeLsum_precision_stderr": 0.0003369009463365385, "rougeLsum_recall": 0.024406964608590324, "rougeLsum_recall_stderr": 0.0005979225418060756}}, "1": {"generate_text_restaurant": {"bleu": 11.199945366026236, "bleu_stderr": 0.09740891554529413, "rouge1_fmeasure": 0.43361162405107295, "rouge1_fmeasure_stderr": 0.0024498717646033665, "rouge1_precision": 0.5190142019208609, "rouge1_precision_stderr": 0.003327240390036289, "rouge1_recall": 0.4114616078138066, "rouge1_recall_stderr": 0.0030408033259645612, "rouge2_fmeasure": 0.1983453767330724, "rouge2_fmeasure_stderr": 0.0019553142654631156, "rouge2_precision": 0.24092206705754915, "rouge2_precision_stderr": 0.0025432949505695425, "rouge2_recall": 0.18797583914402394, "rouge2_recall_stderr": 0.002107165588256214, "rougeL_fmeasure": 0.315514252090379, "rougeL_fmeasure_stderr": 0.0020950130049756485, "rougeL_precision": 0.3810297781145268, "rougeL_precision_stderr": 0.002955659050147338, "rougeL_recall": 0.2982904326283383, "rougeL_recall_stderr": 0.002441126924534855, "rougeLsum_fmeasure": 0.3556790279405754, "rougeLsum_fmeasure_stderr": 0.0023552583830999735, "rougeLsum_precision": 0.4272477194499663, "rougeLsum_precision_stderr": 0.0031895534936824997, "rougeLsum_recall": 0.33692836067640447, "rougeLsum_recall_stderr": 0.0027567274786219256}}, "2": {"generate_text_restaurant": {"bleu": 12.752880813365183, "bleu_stderr": 0.22532887560628184, "rouge1_fmeasure": 0.4576720641979181, "rouge1_fmeasure_stderr": 0.0022953942764252673, "rouge1_precision": 0.5483859178177682, "rouge1_precision_stderr": 0.003284509279619272, "rouge1_recall": 0.4329119599793277, "rouge1_recall_stderr": 0.002935675677350969, "rouge2_fmeasure": 0.22030084182668652, "rouge2_fmeasure_stderr": 0.0020287670329249274, "rouge2_precision": 0.26853962452756747, "rouge2_precision_stderr": 0.002740945324943779, "rouge2_recall": 0.20828673845347298, "rouge2_recall_stderr": 0.0021908686840527536, "rougeL_fmeasure": 0.33784951726273604, "rougeL_fmeasure_stderr": 0.002092067006211518, "rougeL_precision": 0.407475473407987, "rougeL_precision_stderr": 0.0030181731331604795, "rougeL_recall": 0.31883364076878173, "rougeL_recall_stderr": 0.002461630929460497, "rougeLsum_fmeasure": 0.38152814100163385, "rougeLsum_fmeasure_stderr": 0.002318898465385505, "rougeLsum_precision": 0.45802173612428515, "rougeLsum_precision_stderr": 0.003228180984559956, "rougeLsum_recall": 0.3606321592898537, "rougeLsum_recall_stderr": 0.002748101165505275}}, "3": {"generate_text_restaurant": {"bleu": 13.567475379286549, "bleu_stderr": 0.1880502425341883, "rouge1_fmeasure": 0.46365491542004894, "rouge1_fmeasure_stderr": 0.0021794833674578123, "rouge1_precision": 0.54296137339216, "rouge1_precision_stderr": 0.0032385304204834925, "rouge1_recall": 0.4468637477572891, "rouge1_recall_stderr": 0.002870747282334814, "rouge2_fmeasure": 0.22644283092674808, "rouge2_fmeasure_stderr": 0.0020104468971516875, "rouge2_precision": 0.268879550509031, "rouge2_precision_stderr": 0.0026847549706603357, "rouge2_recall": 0.21872430008911764, "rouge2_recall_stderr": 0.0022357966811142774, "rougeL_fmeasure": 0.3445418845511442, "rougeL_fmeasure_stderr": 0.002026802374084494, "rougeL_precision": 0.40563436021398125, "rougeL_precision_stderr": 0.0029671089231426426, "rougeL_recall": 0.33158522150890407, "rougeL_recall_stderr": 0.0024524778139217965, "rougeLsum_fmeasure": 0.3905619856893357, "rougeLsum_fmeasure_stderr": 0.002253731478640236, "rougeLsum_precision": 0.457618460997299, "rougeLsum_precision_stderr": 0.003163617105952389, "rougeLsum_recall": 0.37651908361075154, "rougeLsum_recall_stderr": 0.0027495326994019364}}, "4": {"generate_text_restaurant": {"bleu": 13.740384950752064, "bleu_stderr": 0.17474565384186433, "rouge1_fmeasure": 0.4606344386510922, "rouge1_fmeasure_stderr": 0.0021643969739297475, "rouge1_precision": 0.51943848236802, "rouge1_precision_stderr": 0.0031779058467164764, "rouge1_recall": 0.4567820792568219, "rouge1_recall_stderr": 0.002851642014055284, "rouge2_fmeasure": 0.22570040278921377, "rouge2_fmeasure_stderr": 0.0020088114026586526, "rouge2_precision": 0.25737502763838105, "rouge2_precision_stderr": 0.0026242680468160895, "rouge2_recall": 0.2245153764885056, "rouge2_recall_stderr": 0.0022588441708384973, "rougeL_fmeasure": 0.3427780842217158, "rougeL_fmeasure_stderr": 0.0020244481019983177, "rougeL_precision": 0.3876917725288397, "rougeL_precision_stderr": 0.0028653337007260647, "rougeL_recall": 0.3397952534482862, "rougeL_recall_stderr": 0.0024656674082997676, "rougeLsum_fmeasure": 0.3902532373292503, "rougeLsum_fmeasure_stderr": 0.0022482737601443, "rougeLsum_precision": 0.43916794242095064, "rougeLsum_precision_stderr": 0.0030589422127270337, "rougeLsum_recall": 0.3876015303869884, "rougeLsum_recall_stderr": 0.0027798320723785553}}, "5": {"generate_text_restaurant": {"bleu": 12.772366014464684, "bleu_stderr": 0.1727094167530513, "rouge1_fmeasure": 0.45315037221898985, "rouge1_fmeasure_stderr": 0.002063099268846445, "rouge1_precision": 0.4849957590476985, "rouge1_precision_stderr": 0.0029633904151518614, "rouge1_recall": 0.4698079682696499, "rouge1_recall_stderr": 0.0028147920332754844, "rouge2_fmeasure": 0.2186838500921512, "rouge2_fmeasure_stderr": 0.0018776056949733047, "rouge2_precision": 0.23597412151168465, "rouge2_precision_stderr": 0.0023313187461128483, "rouge2_recall": 0.22775944680052645, "rouge2_recall_stderr": 0.002217444405292992, "rougeL_fmeasure": 0.33617919401288165, "rougeL_fmeasure_stderr": 0.0019141754215681863, "rougeL_precision": 0.36121121776556825, "rougeL_precision_stderr": 0.002645618381599165, "rougeL_recall": 0.3483500842464673, "rougeL_recall_stderr": 0.0024310911003668787, "rougeLsum_fmeasure": 0.3862609489154149, "rougeLsum_fmeasure_stderr": 0.0021169304456593015, "rougeLsum_precision": 0.41312019009298706, "rougeLsum_precision_stderr": 0.0028317325884933, "rougeLsum_recall": 0.40082494576214567, "rougeLsum_recall_stderr": 0.0027213945607275796}}}, "gem_xsum": {"0": {"article_DOC_summary": {"bleu": 1.7916845418214005, "bleu_stderr": 0.07828212807526311, "rouge1_fmeasure": 0.20406385886176096, "rouge1_fmeasure_stderr": 0.00258155674612985, "rouge1_precision": 0.1636017883690539, "rouge1_precision_stderr": 0.0024265639944645607, "rouge1_recall": 0.3135411100199371, "rouge1_recall_stderr": 0.004414059386580781, "rouge2_fmeasure": 0.042825803126534195, "rouge2_fmeasure_stderr": 0.00160599002891498, "rouge2_precision": 0.03326860572215188, "rouge2_precision_stderr": 0.0013712483892843969, "rouge2_recall": 0.06935361806518704, "rouge2_recall_stderr": 0.002630864064398201, "rougeL_fmeasure": 0.154429756081877, "rougeL_fmeasure_stderr": 0.0019969002281278216, "rougeL_precision": 0.12376190274002842, "rougeL_precision_stderr": 0.0019110587602701528, "rougeL_recall": 0.23856624379837527, "rougeL_recall_stderr": 0.0034515198934126907, "rougeLsum_fmeasure": 0.1585898458477123, "rougeLsum_fmeasure_stderr": 0.0021649602354550605, "rougeLsum_precision": 0.12670301550297952, "rougeLsum_precision_stderr": 0.001984240932547222, "rougeLsum_recall": 0.2456847137827434, "rougeLsum_recall_stderr": 0.0037888888942200177}}, "1": {"article_DOC_summary": {"bleu": 1.3135114346532981, "bleu_stderr": 0.08463533356367237, "rouge1_fmeasure": 0.17216405786002645, "rouge1_fmeasure_stderr": 0.002413004919727933, "rouge1_precision": 0.12258398799437052, "rouge1_precision_stderr": 0.0017962630199380857, "rouge1_recall": 0.3012382161995991, "rouge1_recall_stderr": 0.004139509463692997, "rouge2_fmeasure": 0.032550109418001044, "rouge2_fmeasure_stderr": 0.0013323022688404391, "rouge2_precision": 0.022923096739945113, "rouge2_precision_stderr": 0.0009396939072749053, "rouge2_recall": 0.058554066932389494, "rouge2_recall_stderr": 0.002474769338098033, "rougeL_fmeasure": 0.13422605654232356, "rougeL_fmeasure_stderr": 0.0017698404507476406, "rougeL_precision": 0.0953766892949565, "rougeL_precision_stderr": 0.0013021773787458971, "rougeL_recall": 0.2362381442835074, "rougeL_recall_stderr": 0.0031828562476237457, "rougeLsum_fmeasure": 0.13702592659449045, "rougeLsum_fmeasure_stderr": 0.0019551406042742046, "rougeLsum_precision": 0.09729740585688308, "rougeLsum_precision_stderr": 0.001433871342903216, "rougeLsum_recall": 0.24153880156299268, "rougeLsum_recall_stderr": 0.003500903202746728}}, "2": {"article_DOC_summary": {"bleu": 1.2969951394913493, "bleu_stderr": 0.06867031320524596, "rouge1_fmeasure": 0.16848679088873222, "rouge1_fmeasure_stderr": 0.0023805185438281235, "rouge1_precision": 0.12014057910525737, "rouge1_precision_stderr": 0.00177027208032182, "rouge1_recall": 0.2937362802990173, "rouge1_recall_stderr": 0.0040558921767481415, "rouge2_fmeasure": 0.032592328628319726, "rouge2_fmeasure_stderr": 0.001360334296634944, "rouge2_precision": 0.023037471663706975, "rouge2_precision_stderr": 0.0009651714294322547, "rouge2_recall": 0.05808812201139429, "rouge2_recall_stderr": 0.002494816691771811, "rougeL_fmeasure": 0.13752060575301803, "rougeL_fmeasure_stderr": 0.0018652017270717643, "rougeL_precision": 0.09796298255577943, "rougeL_precision_stderr": 0.0013818612760360376, "rougeL_recall": 0.24059048844697575, "rougeL_recall_stderr": 0.0032525841201501613, "rougeLsum_fmeasure": 0.13274693169694082, "rougeLsum_fmeasure_stderr": 0.0019432835336852861, "rougeLsum_precision": 0.09437688045356053, "rougeLsum_precision_stderr": 0.0014232755198755626, "rougeLsum_recall": 0.23332253770052824, "rougeLsum_recall_stderr": 0.0034512361504183474}}, "3": {"article_DOC_summary": {"bleu": 1.327235232469952, "bleu_stderr": 0.09959209280385814, "rouge1_fmeasure": 0.16364844726335212, "rouge1_fmeasure_stderr": 0.002540088417740363, "rouge1_precision": 0.11962719565205662, "rouge1_precision_stderr": 0.002016131135992487, "rouge1_recall": 0.2790081357700044, "rouge1_recall_stderr": 0.0043060099015184835, "rouge2_fmeasure": 0.03286054820200277, "rouge2_fmeasure_stderr": 0.0013434565504320645, "rouge2_precision": 0.02385360834922912, "rouge2_precision_stderr": 0.000982041326291719, "rouge2_recall": 0.057563110969334454, "rouge2_recall_stderr": 0.002474970323879015, "rougeL_fmeasure": 0.13539724940510672, "rougeL_fmeasure_stderr": 0.0020807935996877674, "rougeL_precision": 0.09886948142069724, "rougeL_precision_stderr": 0.0016489525812605937, "rougeL_recall": 0.23196290924579455, "rougeL_recall_stderr": 0.003657598924470169, "rougeLsum_fmeasure": 0.12875250329964805, "rougeLsum_fmeasure_stderr": 0.0020505398481043147, "rougeLsum_precision": 0.09403709487175377, "rougeLsum_precision_stderr": 0.0016315538581778424, "rougeLsum_recall": 0.22096634372218205, "rougeLsum_recall_stderr": 0.0036039318241550657}}, "4": {"article_DOC_summary": {"bleu": 0.720494287805737, "bleu_stderr": 0.13337005008364483, "rouge1_fmeasure": 0.04714699127177818, "rouge1_fmeasure_stderr": 0.002660932299544834, "rouge1_precision": 0.04098939178475802, "rouge1_precision_stderr": 0.0026204420208068035, "rouge1_recall": 0.07322660875950299, "rouge1_recall_stderr": 0.0042459458791253716, "rouge2_fmeasure": 0.01002600655383815, "rouge2_fmeasure_stderr": 0.0009249273635939417, "rouge2_precision": 0.009005101634115067, "rouge2_precision_stderr": 0.00121171937903932, "rouge2_recall": 0.016152720952389045, "rouge2_recall_stderr": 0.0015904264999107502, "rougeL_fmeasure": 0.038851245646855916, "rougeL_fmeasure_stderr": 0.002177065038104623, "rougeL_precision": 0.034375344099908396, "rougeL_precision_stderr": 0.002283572080585189, "rougeL_recall": 0.06037717457617166, "rougeL_recall_stderr": 0.0035163081114451514, "rougeLsum_fmeasure": 0.03782418886463528, "rougeLsum_fmeasure_stderr": 0.0021755326176048475, "rougeLsum_precision": 0.03382829886719806, "rougeLsum_precision_stderr": 0.002342085999586738, "rougeLsum_recall": 0.05845333975676655, "rougeLsum_recall_stderr": 0.003459845391454891}}, "5": {"article_DOC_summary": {"bleu": 1.437491909962072e-37, "bleu_stderr": 6.679183284996885e-31, "rouge1_fmeasure": 0.002482537431673434, "rouge1_fmeasure_stderr": 0.0006590331629581881, "rouge1_precision": 0.0027818328091416475, "rouge1_precision_stderr": 0.0007401612256325405, "rouge1_recall": 0.002330798812107932, "rouge1_recall_stderr": 0.0006256804823539565, "rouge2_fmeasure": 0.00028593668938742907, "rouge2_fmeasure_stderr": 0.00011751104642033578, "rouge2_precision": 0.0003101211896994361, "rouge2_precision_stderr": 0.00012661794961734148, "rouge2_recall": 0.0002680102915951972, "rouge2_recall_stderr": 0.00011124280815470673, "rougeL_fmeasure": 0.001846067784976754, "rougeL_fmeasure_stderr": 0.0005022326643801285, "rougeL_precision": 0.0020462530294442205, "rougeL_precision_stderr": 0.0005534615847200946, "rougeL_recall": 0.0017580325391528475, "rougeL_recall_stderr": 0.0004906057300283716, "rougeLsum_fmeasure": 0.002260942501090202, "rougeLsum_fmeasure_stderr": 0.0006097815513991564, "rougeLsum_precision": 0.0025260844263122434, "rougeLsum_precision_stderr": 0.0006786126789253857, "rougeLsum_recall": 0.002133328291896597, "rougeLsum_recall_stderr": 0.000585991073578324}}}} \ No newline at end of file diff --git a/4b284b84bc4seed1/evaluation/generation/slim.4b284b84bc4seed1_GEM-web_nlg_en_PALM_prompt_0.json b/4b284b84bc4seed1/evaluation/generation/slim.4b284b84bc4seed1_GEM-web_nlg_en_PALM_prompt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..4006210de7dddbbd05495dd476f61ceedb04a060 --- /dev/null +++ b/4b284b84bc4seed1/evaluation/generation/slim.4b284b84bc4seed1_GEM-web_nlg_en_PALM_prompt_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.4177738397053596, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.052439714987504826 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07401331365029154, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.001555945380008501 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.309544677126812, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.004598258018956965 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.11313553204694117, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0020976821294602234 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03523505191827857, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0009392296781654515 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.15329454407408277, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003251728201432321 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.05411413548524944, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0013020734544028827 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.07061132409656197, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0014031957668770357 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.30042353738636374, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0044778245769371994 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.10845705136602556, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0019284471387199143 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.07049851230067716, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.001450359178267902 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.296810156480222, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0043631335921961835 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.10792394253569278, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0019640770726289487 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed1/evaluation/generation/slim.4b284b84bc4seed1_GEM-web_nlg_en_PALM_prompt_1.json b/4b284b84bc4seed1/evaluation/generation/slim.4b284b84bc4seed1_GEM-web_nlg_en_PALM_prompt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..72f37e3e634c5ffb5bc2c91577327fa1f85da1fe --- /dev/null +++ b/4b284b84bc4seed1/evaluation/generation/slim.4b284b84bc4seed1_GEM-web_nlg_en_PALM_prompt_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.5808615724978651, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.03393350967485746 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.08183691647303251, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0015166625147494993 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.40093348191479217, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005450906036616762 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.12727475120836446, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.002035424606741712 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.039062153239498784, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0009349863984338872 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.20112348772170943, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003804920107675235 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.06096091447803779, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0012946551599852026 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.07650521343895433, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0013445352921906551 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.37517446453693076, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004982125783681737 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.1192836731407637, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.001834016996545526 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.07726225443418276, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.001411238354454551 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.3769882191273612, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004973103856227287 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.12012804167712486, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0018942369664582516 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed1/evaluation/generation/slim.4b284b84bc4seed1_GEM-web_nlg_en_PALM_prompt_2.json b/4b284b84bc4seed1/evaluation/generation/slim.4b284b84bc4seed1_GEM-web_nlg_en_PALM_prompt_2.json new file mode 100644 index 0000000000000000000000000000000000000000..baa710b542ec62d95d2cf75672fd7d0d4d8907a2 --- /dev/null +++ b/4b284b84bc4seed1/evaluation/generation/slim.4b284b84bc4seed1_GEM-web_nlg_en_PALM_prompt_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.6974388179157304, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.030575587628070142 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.08378329306693072, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.001459322065449314 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.4295176674907729, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005387840357836537 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.13158075248220336, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0019778747548532725 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03959861804048329, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0008790815089921375 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.21857768529907604, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003978406350005915 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.06253675704279393, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0012350283375229683 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.0765488634109198, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.001262760988042247 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.3942968542813885, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004825967992749896 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.12041670906511595, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.001724997794417473 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.07912745617089588, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0013596543752117662 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.40482037642139057, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004938559564217245 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.12422716343042028, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0018397851260800163 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed1/evaluation/generation/slim.4b284b84bc4seed1_GEM-web_nlg_en_PALM_prompt_3.json b/4b284b84bc4seed1/evaluation/generation/slim.4b284b84bc4seed1_GEM-web_nlg_en_PALM_prompt_3.json new file mode 100644 index 0000000000000000000000000000000000000000..1f6991fdb5ae73f730076259aed5b27ed9c9dffc --- /dev/null +++ b/4b284b84bc4seed1/evaluation/generation/slim.4b284b84bc4seed1_GEM-web_nlg_en_PALM_prompt_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.8278535585588646, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.04101323263962433 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.08547615960283327, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0014631064392462048 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.45233724476476256, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005498610961440376 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.13488847581723404, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0019541441973022983 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.04064020009202515, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0009117668832831653 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.23147273606302815, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.004055355768121839 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.06437212669435428, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0012436500824994457 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.07766706751152817, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0012705151561288445 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.4116826372221156, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004846073095478439 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.12265416975642841, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.001687981425852585 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.08067112264899551, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0013779713860748017 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.42508315288079185, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.005020947504999342 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.12722726363829323, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0018316120685934315 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed1/evaluation/generation/slim.4b284b84bc4seed1_GEM-web_nlg_en_PALM_prompt_4.json b/4b284b84bc4seed1/evaluation/generation/slim.4b284b84bc4seed1_GEM-web_nlg_en_PALM_prompt_4.json new file mode 100644 index 0000000000000000000000000000000000000000..aa540722eedc6200892d2d8169a9cee02f47e890 --- /dev/null +++ b/4b284b84bc4seed1/evaluation/generation/slim.4b284b84bc4seed1_GEM-web_nlg_en_PALM_prompt_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.8696996582752973, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.06098328946071962 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.0846654378867452, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0014210010721050707 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.4578457479151435, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005514991901446975 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.1345378611428427, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0019444813188940376 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03959585063348627, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.000862580003329711 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.2318178313336565, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0041148040681156135 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.06331896436631664, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0012304846406140408 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.07578970344610945, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0011783081782238954 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.4122041018783002, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004808418678515961 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.1206116472621873, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.001620078997028922 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.0796291662268957, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.001316435535538898 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.43058423280412716, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.005076088365482536 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.12652519308473198, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0018015979293605463 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed1/evaluation/generation/slim.4b284b84bc4seed1_GEM-web_nlg_en_PALM_prompt_5.json b/4b284b84bc4seed1/evaluation/generation/slim.4b284b84bc4seed1_GEM-web_nlg_en_PALM_prompt_5.json new file mode 100644 index 0000000000000000000000000000000000000000..d93502da200926766fa38e453521a74a8c87debc --- /dev/null +++ b/4b284b84bc4seed1/evaluation/generation/slim.4b284b84bc4seed1_GEM-web_nlg_en_PALM_prompt_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.9386565201757037, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.044526839780327905 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.08665394421115923, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0013765101453522592 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.479351769718965, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.00548474489542107 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.13836362229996832, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.001893431540140422 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.04073112194630253, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0008342579281972372 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.24709583361079115, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.004288275564287053 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.06552803780701107, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.001201220687887674 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.07688627300671028, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0011617752110929672 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.4288123063878505, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004826731215989172 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.12284158062218388, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0015900050300239478 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.08154653189712766, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.001288193874235195 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.4505990363238062, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.005059301966187745 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.1301416572009741, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.001768541697398853 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed1/evaluation/generation/slim.4b284b84bc4seed1_GEM-wiki_lingua_en_tldr_en_0.json b/4b284b84bc4seed1/evaluation/generation/slim.4b284b84bc4seed1_GEM-wiki_lingua_en_tldr_en_0.json new file mode 100644 index 0000000000000000000000000000000000000000..f3198621643f2ca02a81af15cc63687821fef5d3 --- /dev/null +++ b/4b284b84bc4seed1/evaluation/generation/slim.4b284b84bc4seed1_GEM-wiki_lingua_en_tldr_en_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.13997262682188616, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0018152662704601968 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.23988301526777517, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0026425508349757127 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.16422245329729376, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0018151110735496203 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.02739555088551612, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007299475693711506 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.04882561093577656, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0013519389814047277 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.03235069293218825, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0008205093824111827 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.10940153468767774, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0012797812738055785 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.19392296248486443, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0021299443087579575 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.1298012454573935, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0013082389095494423 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.12920003480420952, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0016583776510762952 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.22237769560119033, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.002445338658648684 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.15178310664024564, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0016581127885119964 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 1.4010466021962698, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.05693469656785709 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed1/evaluation/generation/slim.4b284b84bc4seed1_GEM-wiki_lingua_en_tldr_en_1.json b/4b284b84bc4seed1/evaluation/generation/slim.4b284b84bc4seed1_GEM-wiki_lingua_en_tldr_en_1.json new file mode 100644 index 0000000000000000000000000000000000000000..2ba074592f48add413b53fb2d7494921ee56788b --- /dev/null +++ b/4b284b84bc4seed1/evaluation/generation/slim.4b284b84bc4seed1_GEM-wiki_lingua_en_tldr_en_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.19237806407108246, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.002156616087328965 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.3212993636930355, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.002829724921518021 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.22176158764199283, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0019496812102440851 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.04730550033705585, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0010038562816699207 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.0810126790953652, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0016920263323925329 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.05436564304591471, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0010398581680374484 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.13189452873558555, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0014440357444886517 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.22728266255319154, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0021740082956540176 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.15298606072602197, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.001269522698605816 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.1799760146194542, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.002013284357082607 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.3015175800896575, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0026743484362997554 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.20773701812397452, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0018267476451028011 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 2.6792767534985105, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.08050348994884776 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed1/evaluation/generation/slim.4b284b84bc4seed1_GEM-wiki_lingua_en_tldr_en_2.json b/4b284b84bc4seed1/evaluation/generation/slim.4b284b84bc4seed1_GEM-wiki_lingua_en_tldr_en_2.json new file mode 100644 index 0000000000000000000000000000000000000000..e979075b6808ec8877b6c2da4d7f361f01cce538 --- /dev/null +++ b/4b284b84bc4seed1/evaluation/generation/slim.4b284b84bc4seed1_GEM-wiki_lingua_en_tldr_en_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.19587403318777896, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.002246482935330373 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.3104623013424553, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0026357716525505985 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.21881031202295378, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0018340980892655135 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.049518456494770303, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.001177357025652893 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.07843155253080596, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0016707411483431178 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.05407980043809886, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0010322675581464652 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.13795120173138903, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.001669101235947338 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.22381109650316425, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.002115149596829255 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.15447333837028793, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0012811266282334365 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.18399939129198817, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0021107295487964614 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.2924275031032992, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0024986416120394883 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.20577620783096848, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0017206650892505897 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 2.825588151177289, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.0827483173505062 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed1/evaluation/generation/slim.4b284b84bc4seed1_GEM-wiki_lingua_en_tldr_en_3.json b/4b284b84bc4seed1/evaluation/generation/slim.4b284b84bc4seed1_GEM-wiki_lingua_en_tldr_en_3.json new file mode 100644 index 0000000000000000000000000000000000000000..5bbdf1f064e5b98679f73fa7181b39b440e4210c --- /dev/null +++ b/4b284b84bc4seed1/evaluation/generation/slim.4b284b84bc4seed1_GEM-wiki_lingua_en_tldr_en_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.1647227013547415, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0024792520261390483 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.2560613183847905, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0032797831033041618 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.17955806504481292, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.002195205258030929 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.040393011250336536, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.001120492765195676 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.06579426072456108, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.001694481658818446 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.04429422701774445, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0010178187766663955 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.11737676404806478, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0018604626033532456 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.1856490443924171, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.00253379229574718 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.12746828061030624, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0015396980890683188 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.15523651118051682, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0023598380194680005 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.24112578036228802, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0030888339817801563 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.1689495507422565, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0020580481966186253 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 2.77140298721746, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.09911601058676267 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed1/evaluation/generation/slim.4b284b84bc4seed1_GEM-wiki_lingua_en_tldr_en_4.json b/4b284b84bc4seed1/evaluation/generation/slim.4b284b84bc4seed1_GEM-wiki_lingua_en_tldr_en_4.json new file mode 100644 index 0000000000000000000000000000000000000000..a9bee47ccbbf20f351cbe3fa2329740c7316ad63 --- /dev/null +++ b/4b284b84bc4seed1/evaluation/generation/slim.4b284b84bc4seed1_GEM-wiki_lingua_en_tldr_en_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.053177399565422716, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.001969539589668854 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.08460445332976693, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.002887654568198146 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.05724507901787019, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.001923136290184156 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.012859547969705542, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.000726325510216138 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.02237244864266085, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0012034662851936587 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.014128667931700438, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0006962023161566057 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.03993285011532237, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0014928569276828109 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.06466228514995502, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0022622950372018576 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.042868526761057124, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0014217476738280137 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.05008717864701033, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0018614454895917413 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.07995227312474681, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0027408841913450226 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.053934021939145045, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0018135115805431904 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 0.6374428010243339, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.04679817619985886 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed1/evaluation/generation/slim.4b284b84bc4seed1_GEM-wiki_lingua_en_tldr_en_5.json b/4b284b84bc4seed1/evaluation/generation/slim.4b284b84bc4seed1_GEM-wiki_lingua_en_tldr_en_5.json new file mode 100644 index 0000000000000000000000000000000000000000..0025d575e87a286d601e1f7ca9ee56726883a75b --- /dev/null +++ b/4b284b84bc4seed1/evaluation/generation/slim.4b284b84bc4seed1_GEM-wiki_lingua_en_tldr_en_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.009250162353650573, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0009501892043502089 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.01399225543923628, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0013479443593293063 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.009409482800898775, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0008719922868900455 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.0025132950634529213, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0003496566473256293 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.003986174570934941, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0005228969007076435 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.0024954950292378434, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.00030758521273803235 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.006939530851512524, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.000721287497804254 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.010674568197211812, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0010578455964358668 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.007016931130854418, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0006474630715093982 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.008770387592628782, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0008958471929010777 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.013287426441297979, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0012768296011753365 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.008928183444317063, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0008250504967685091 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 1.5497714003816197e-06, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 2.826544891292017e-06 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed1/evaluation/generation/slim.4b284b84bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_0.json b/4b284b84bc4seed1/evaluation/generation/slim.4b284b84bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..74c02fbaebafe7ae48f1c6a0fb1d69b7b25cf849 --- /dev/null +++ b/4b284b84bc4seed1/evaluation/generation/slim.4b284b84bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 0.01707387064925112, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.004548339499332125 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.01479209987025161, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0003848187529004132 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.02647907855108807, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0007373776368265799 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.01833385014011665, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0004556651351480112 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.00018468533574224637, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 3.7035782299895355e-05 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.00032184358555587336, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 6.80865158511292e-05 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.00022602188070215841, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 4.551736869387828e-05 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.014749675627827365, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0003794521861304636 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.02642067669572227, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0007319703340695989 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.01828543709345876, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.000449785707890762 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.01381746395527955, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0003369009463365385 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.024406964608590324, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0005979225418060756 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.017042834318925764, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.00038117023392555423 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed1/evaluation/generation/slim.4b284b84bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_1.json b/4b284b84bc4seed1/evaluation/generation/slim.4b284b84bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_1.json new file mode 100644 index 0000000000000000000000000000000000000000..6b0fbcbd418b57e4f1a0c29cbfb577afe7a1779f --- /dev/null +++ b/4b284b84bc4seed1/evaluation/generation/slim.4b284b84bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 11.199945366026236, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.09740891554529413 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.5190142019208609, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.003327240390036289 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4114616078138066, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0030408033259645612 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.43361162405107295, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0024498717646033665 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.24092206705754915, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0025432949505695425 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.18797583914402394, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.002107165588256214 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.1983453767330724, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0019553142654631156 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.3810297781145268, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.002955659050147338 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.2982904326283383, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.002441126924534855 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.315514252090379, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0020950130049756485 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.4272477194499663, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0031895534936824997 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.33692836067640447, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0027567274786219256 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.3556790279405754, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0023552583830999735 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed1/evaluation/generation/slim.4b284b84bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_2.json b/4b284b84bc4seed1/evaluation/generation/slim.4b284b84bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_2.json new file mode 100644 index 0000000000000000000000000000000000000000..4f0cb404f5dbe953543b1bf936cf202e141ff680 --- /dev/null +++ b/4b284b84bc4seed1/evaluation/generation/slim.4b284b84bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 12.752880813365183, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.22532887560628184 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.5483859178177682, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.003284509279619272 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4329119599793277, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.002935675677350969 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.4576720641979181, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0022953942764252673 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.26853962452756747, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.002740945324943779 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.20828673845347298, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0021908686840527536 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.22030084182668652, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0020287670329249274 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.407475473407987, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0030181731331604795 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.31883364076878173, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.002461630929460497 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.33784951726273604, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.002092067006211518 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.45802173612428515, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.003228180984559956 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3606321592898537, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002748101165505275 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.38152814100163385, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.002318898465385505 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed1/evaluation/generation/slim.4b284b84bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_3.json b/4b284b84bc4seed1/evaluation/generation/slim.4b284b84bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_3.json new file mode 100644 index 0000000000000000000000000000000000000000..0f53e160526e496baaa50e868992d54b543f8c67 --- /dev/null +++ b/4b284b84bc4seed1/evaluation/generation/slim.4b284b84bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 13.567475379286549, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.1880502425341883 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.54296137339216, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0032385304204834925 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4468637477572891, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.002870747282334814 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.46365491542004894, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0021794833674578123 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.268879550509031, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0026847549706603357 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.21872430008911764, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0022357966811142774 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.22644283092674808, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0020104468971516875 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.40563436021398125, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0029671089231426426 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.33158522150890407, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0024524778139217965 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.3445418845511442, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.002026802374084494 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.457618460997299, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.003163617105952389 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.37651908361075154, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0027495326994019364 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.3905619856893357, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.002253731478640236 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed1/evaluation/generation/slim.4b284b84bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_4.json b/4b284b84bc4seed1/evaluation/generation/slim.4b284b84bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_4.json new file mode 100644 index 0000000000000000000000000000000000000000..47bc9a04144cf08b9cda749320d8c4fc6578e728 --- /dev/null +++ b/4b284b84bc4seed1/evaluation/generation/slim.4b284b84bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 13.740384950752064, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.17474565384186433 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.51943848236802, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0031779058467164764 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4567820792568219, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.002851642014055284 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.4606344386510922, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0021643969739297475 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.25737502763838105, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0026242680468160895 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.2245153764885056, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0022588441708384973 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.22570040278921377, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0020088114026586526 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.3876917725288397, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0028653337007260647 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3397952534482862, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0024656674082997676 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.3427780842217158, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0020244481019983177 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.43916794242095064, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0030589422127270337 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3876015303869884, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0027798320723785553 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.3902532373292503, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0022482737601443 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed1/evaluation/generation/slim.4b284b84bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_5.json b/4b284b84bc4seed1/evaluation/generation/slim.4b284b84bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_5.json new file mode 100644 index 0000000000000000000000000000000000000000..9de794eee2de71654a0c812428ecd5700dfd86ce --- /dev/null +++ b/4b284b84bc4seed1/evaluation/generation/slim.4b284b84bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 12.772366014464684, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.1727094167530513 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.4849957590476985, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0029633904151518614 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4698079682696499, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0028147920332754844 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.45315037221898985, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.002063099268846445 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.23597412151168465, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0023313187461128483 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.22775944680052645, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.002217444405292992 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.2186838500921512, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0018776056949733047 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.36121121776556825, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.002645618381599165 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3483500842464673, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0024310911003668787 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.33617919401288165, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0019141754215681863 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.41312019009298706, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0028317325884933 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.40082494576214567, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0027213945607275796 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.3862609489154149, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0021169304456593015 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed1/evaluation/generation/slim.4b284b84bc4seed1_gem_xsum_article_DOC_summary_0.json b/4b284b84bc4seed1/evaluation/generation/slim.4b284b84bc4seed1_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..e636003b13cbeef66866583bfcc4041915b7d31a --- /dev/null +++ b/4b284b84bc4seed1/evaluation/generation/slim.4b284b84bc4seed1_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.1636017883690539, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0024265639944645607 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.3135411100199371, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004414059386580781 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.20406385886176096, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.00258155674612985 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.03326860572215188, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0013712483892843969 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.06935361806518704, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.002630864064398201 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.042825803126534195, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.00160599002891498 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.12376190274002842, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0019110587602701528 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.23856624379837527, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0034515198934126907 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.154429756081877, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0019969002281278216 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.12670301550297952, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.001984240932547222 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.2456847137827434, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0037888888942200177 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.1585898458477123, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0021649602354550605 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.7916845418214005, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.07828212807526311 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed1/evaluation/generation/slim.4b284b84bc4seed1_gem_xsum_article_DOC_summary_1.json b/4b284b84bc4seed1/evaluation/generation/slim.4b284b84bc4seed1_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..ac451eadcf1463bd5f28cd6011f15aedecc0b0a9 --- /dev/null +++ b/4b284b84bc4seed1/evaluation/generation/slim.4b284b84bc4seed1_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.12258398799437052, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0017962630199380857 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.3012382161995991, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004139509463692997 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.17216405786002645, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.002413004919727933 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.022923096739945113, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0009396939072749053 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.058554066932389494, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.002474769338098033 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.032550109418001044, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0013323022688404391 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.0953766892949565, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0013021773787458971 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.2362381442835074, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0031828562476237457 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.13422605654232356, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0017698404507476406 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.09729740585688308, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.001433871342903216 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.24153880156299268, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.003500903202746728 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.13702592659449045, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0019551406042742046 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.3135114346532981, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.08463533356367237 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed1/evaluation/generation/slim.4b284b84bc4seed1_gem_xsum_article_DOC_summary_2.json b/4b284b84bc4seed1/evaluation/generation/slim.4b284b84bc4seed1_gem_xsum_article_DOC_summary_2.json new file mode 100644 index 0000000000000000000000000000000000000000..7910ff4e6ed0074da098f61ce61a49203c780d6f --- /dev/null +++ b/4b284b84bc4seed1/evaluation/generation/slim.4b284b84bc4seed1_gem_xsum_article_DOC_summary_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.12014057910525737, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.00177027208032182 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.2937362802990173, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.0040558921767481415 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.16848679088873222, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0023805185438281235 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.023037471663706975, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0009651714294322547 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.05808812201139429, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.002494816691771811 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.032592328628319726, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.001360334296634944 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.09796298255577943, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0013818612760360376 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.24059048844697575, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0032525841201501613 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.13752060575301803, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0018652017270717643 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.09437688045356053, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0014232755198755626 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.23332253770052824, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0034512361504183474 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.13274693169694082, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0019432835336852861 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.2969951394913493, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.06867031320524596 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed1/evaluation/generation/slim.4b284b84bc4seed1_gem_xsum_article_DOC_summary_3.json b/4b284b84bc4seed1/evaluation/generation/slim.4b284b84bc4seed1_gem_xsum_article_DOC_summary_3.json new file mode 100644 index 0000000000000000000000000000000000000000..e67a757a04108fc1a2b898e3e8763d11a8169d9c --- /dev/null +++ b/4b284b84bc4seed1/evaluation/generation/slim.4b284b84bc4seed1_gem_xsum_article_DOC_summary_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.11962719565205662, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.002016131135992487 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.2790081357700044, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.0043060099015184835 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.16364844726335212, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.002540088417740363 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.02385360834922912, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.000982041326291719 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.057563110969334454, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.002474970323879015 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.03286054820200277, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0013434565504320645 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.09886948142069724, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0016489525812605937 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.23196290924579455, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.003657598924470169 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.13539724940510672, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0020807935996877674 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.09403709487175377, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0016315538581778424 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.22096634372218205, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0036039318241550657 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.12875250329964805, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0020505398481043147 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.327235232469952, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.09959209280385814 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed1/evaluation/generation/slim.4b284b84bc4seed1_gem_xsum_article_DOC_summary_4.json b/4b284b84bc4seed1/evaluation/generation/slim.4b284b84bc4seed1_gem_xsum_article_DOC_summary_4.json new file mode 100644 index 0000000000000000000000000000000000000000..76b006439886f8a537a9e3fd15c605299b9ffe4e --- /dev/null +++ b/4b284b84bc4seed1/evaluation/generation/slim.4b284b84bc4seed1_gem_xsum_article_DOC_summary_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.04098939178475802, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0026204420208068035 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.07322660875950299, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.0042459458791253716 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.04714699127177818, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.002660932299544834 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.009005101634115067, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.00121171937903932 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.016152720952389045, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0015904264999107502 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.01002600655383815, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0009249273635939417 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.034375344099908396, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.002283572080585189 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.06037717457617166, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0035163081114451514 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.038851245646855916, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.002177065038104623 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.03382829886719806, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.002342085999586738 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.05845333975676655, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.003459845391454891 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.03782418886463528, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0021755326176048475 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 0.720494287805737, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.13337005008364483 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed1/evaluation/generation/slim.4b284b84bc4seed1_gem_xsum_article_DOC_summary_5.json b/4b284b84bc4seed1/evaluation/generation/slim.4b284b84bc4seed1_gem_xsum_article_DOC_summary_5.json new file mode 100644 index 0000000000000000000000000000000000000000..da13280f4de5e282611c4de2f208a332aef134f3 --- /dev/null +++ b/4b284b84bc4seed1/evaluation/generation/slim.4b284b84bc4seed1_gem_xsum_article_DOC_summary_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.0027818328091416475, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0007401612256325405 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.002330798812107932, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.0006256804823539565 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.002482537431673434, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0006590331629581881 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.0003101211896994361, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.00012661794961734148 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.0002680102915951972, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.00011124280815470673 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.00028593668938742907, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.00011751104642033578 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.0020462530294442205, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0005534615847200946 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.0017580325391528475, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0004906057300283716 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.001846067784976754, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0005022326643801285 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.0025260844263122434, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0006786126789253857 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.002133328291896597, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.000585991073578324 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.002260942501090202, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0006097815513991564 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.437491909962072e-37, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 6.679183284996885e-31 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed1/evaluation/rankeval/4b284b84bc4seed1_0.csv b/4b284b84bc4seed1/evaluation/rankeval/4b284b84bc4seed1_0.csv new file mode 100644 index 0000000000000000000000000000000000000000..fc3ee64f377ebf793e06b070343366110de28015 --- /dev/null +++ b/4b284b84bc4seed1/evaluation/rankeval/4b284b84bc4seed1_0.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.329,0.014865395385928367,0 +anli_r2,acc,0.32,0.014758652303574878,0 +anli_r3,acc,0.3408333333333333,0.013688600793296939,0 +arc_challenge,acc,0.26023890784982934,0.012821930225112566,0 +arc_challenge,acc_norm,0.3003412969283277,0.013395909309956997,0 +arc_easy,acc,0.6102693602693603,0.010007169391797051,0 +arc_easy,acc_norm,0.5538720538720538,0.01020005782876501,0 +boolq,acc,0.6180428134556575,0.008497851998427192,1 +cb,acc,0.48214285714285715,0.0673769750864465,1 +cb,f1,0.3335687382297552,,1 +copa,acc,0.76,0.04292346959909283,0 +hellaswag,acc,0.48028281218880703,0.004985900172317698,0 +hellaswag,acc_norm,0.6314479187412866,0.004814261966376849,0 +piqa,acc,0.7633297062023939,0.009916841655042809,0 +piqa,acc_norm,0.7665941240478781,0.009869247889520986,0 +rte,acc,0.5090252707581228,0.030091559826331334,0 +sciq,acc,0.853,0.011203415395160336,0 +sciq,acc_norm,0.773,0.013253174964763921,0 +storycloze_2016,acc,0.7215392838054516,0.010365521460604413,0 +winogrande,acc,0.5682715074980268,0.01392087211001071,0 diff --git a/4b284b84bc4seed1/evaluation/rankeval/4b284b84bc4seed1_0.json b/4b284b84bc4seed1/evaluation/rankeval/4b284b84bc4seed1_0.json new file mode 100644 index 0000000000000000000000000000000000000000..e337059dd12ce0bf354d9042d743335e0d297a4b --- /dev/null +++ b/4b284b84bc4seed1/evaluation/rankeval/4b284b84bc4seed1_0.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.329, + "acc_stderr": 0.014865395385928367 + }, + "anli_r2": { + "acc": 0.32, + "acc_stderr": 0.014758652303574878 + }, + "anli_r3": { + "acc": 0.3408333333333333, + "acc_stderr": 0.013688600793296939 + }, + "cb": { + "acc": 0.48214285714285715, + "acc_stderr": 0.0673769750864465, + "f1": 0.3335687382297552 + }, + "copa": { + "acc": 0.76, + "acc_stderr": 0.04292346959909283 + }, + "hellaswag": { + "acc": 0.48028281218880703, + "acc_stderr": 0.004985900172317698, + "acc_norm": 0.6314479187412866, + "acc_norm_stderr": 0.004814261966376849 + }, + "rte": { + "acc": 0.5090252707581228, + "acc_stderr": 0.030091559826331334 + }, + "winogrande": { + "acc": 0.5682715074980268, + "acc_stderr": 0.01392087211001071 + }, + "storycloze_2016": { + "acc": 0.7215392838054516, + "acc_stderr": 0.010365521460604413 + }, + "boolq": { + "acc": 0.6180428134556575, + "acc_stderr": 0.008497851998427192 + }, + "arc_easy": { + "acc": 0.6102693602693603, + "acc_stderr": 0.010007169391797051, + "acc_norm": 0.5538720538720538, + "acc_norm_stderr": 0.01020005782876501 + }, + "arc_challenge": { + "acc": 0.26023890784982934, + "acc_stderr": 0.012821930225112566, + "acc_norm": 0.3003412969283277, + "acc_norm_stderr": 0.013395909309956997 + }, + "sciq": { + "acc": 0.853, + "acc_stderr": 0.011203415395160336, + "acc_norm": 0.773, + "acc_norm_stderr": 0.013253174964763921 + }, + "piqa": { + "acc": 0.7633297062023939, + "acc_stderr": 0.009916841655042809, + "acc_norm": 0.7665941240478781, + "acc_norm_stderr": 0.009869247889520986 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed1/evaluation/rankeval/4b284b84bc4seed1_1.csv b/4b284b84bc4seed1/evaluation/rankeval/4b284b84bc4seed1_1.csv new file mode 100644 index 0000000000000000000000000000000000000000..f24079b092140b0a1cba54a80fc3191db648c4f4 --- /dev/null +++ b/4b284b84bc4seed1/evaluation/rankeval/4b284b84bc4seed1_1.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.305,0.014566646394664387,0 +anli_r2,acc,0.317,0.014721675438880213,0 +anli_r3,acc,0.335,0.013630871843821477,0 +arc_challenge,acc,0.29436860068259385,0.013318528460539427,0 +arc_challenge,acc_norm,0.3097269624573379,0.013512058415238361,0 +arc_easy,acc,0.6195286195286195,0.009962305992058584,0 +arc_easy,acc_norm,0.5904882154882155,0.010090368160990062,0 +boolq,acc,0.6314984709480123,0.00843719989350296,1 +cb,acc,0.5357142857142857,0.06724777654937658,1 +cb,f1,0.37216374269005853,,1 +copa,acc,0.76,0.04292346959909283,0 +hellaswag,acc,0.4765982871937861,0.004984313205791443,0 +hellaswag,acc_norm,0.6290579565823541,0.004820697457420433,0 +piqa,acc,0.7627856365614799,0.009924694933586376,0 +piqa,acc_norm,0.7584330794341676,0.009986718001804444,0 +rte,acc,0.555956678700361,0.029907396333795987,0 +sciq,acc,0.905,0.009276910103103322,0 +sciq,acc_norm,0.876,0.01042749887234396,0 +storycloze_2016,acc,0.7172634954569749,0.01041380648612127,0 +winogrande,acc,0.5816890292028414,0.013863669961195904,0 diff --git a/4b284b84bc4seed1/evaluation/rankeval/4b284b84bc4seed1_1.json b/4b284b84bc4seed1/evaluation/rankeval/4b284b84bc4seed1_1.json new file mode 100644 index 0000000000000000000000000000000000000000..7e592762fd24f0ab366ef361ee952b6fddb12464 --- /dev/null +++ b/4b284b84bc4seed1/evaluation/rankeval/4b284b84bc4seed1_1.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.305, + "acc_stderr": 0.014566646394664387 + }, + "anli_r2": { + "acc": 0.317, + "acc_stderr": 0.014721675438880213 + }, + "anli_r3": { + "acc": 0.335, + "acc_stderr": 0.013630871843821477 + }, + "cb": { + "acc": 0.5357142857142857, + "acc_stderr": 0.06724777654937658, + "f1": 0.37216374269005853 + }, + "copa": { + "acc": 0.76, + "acc_stderr": 0.04292346959909283 + }, + "hellaswag": { + "acc": 0.4765982871937861, + "acc_stderr": 0.004984313205791443, + "acc_norm": 0.6290579565823541, + "acc_norm_stderr": 0.004820697457420433 + }, + "rte": { + "acc": 0.555956678700361, + "acc_stderr": 0.029907396333795987 + }, + "winogrande": { + "acc": 0.5816890292028414, + "acc_stderr": 0.013863669961195904 + }, + "storycloze_2016": { + "acc": 0.7172634954569749, + "acc_stderr": 0.01041380648612127 + }, + "boolq": { + "acc": 0.6314984709480123, + "acc_stderr": 0.00843719989350296 + }, + "arc_easy": { + "acc": 0.6195286195286195, + "acc_stderr": 0.009962305992058584, + "acc_norm": 0.5904882154882155, + "acc_norm_stderr": 0.010090368160990062 + }, + "arc_challenge": { + "acc": 0.29436860068259385, + "acc_stderr": 0.013318528460539427, + "acc_norm": 0.3097269624573379, + "acc_norm_stderr": 0.013512058415238361 + }, + "sciq": { + "acc": 0.905, + "acc_stderr": 0.009276910103103322, + "acc_norm": 0.876, + "acc_norm_stderr": 0.01042749887234396 + }, + "piqa": { + "acc": 0.7627856365614799, + "acc_stderr": 0.009924694933586376, + "acc_norm": 0.7584330794341676, + "acc_norm_stderr": 0.009986718001804444 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed1/evaluation/rankeval/4b284b84bc4seed1_2.csv b/4b284b84bc4seed1/evaluation/rankeval/4b284b84bc4seed1_2.csv new file mode 100644 index 0000000000000000000000000000000000000000..52ec67c040c5352f117b62adb6bdc21c1dfd0f71 --- /dev/null +++ b/4b284b84bc4seed1/evaluation/rankeval/4b284b84bc4seed1_2.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.309,0.014619600977206493,0 +anli_r2,acc,0.325,0.014818724459095524,0 +anli_r3,acc,0.32916666666666666,0.013570806258433625,0 +arc_challenge,acc,0.27986348122866894,0.01311904089772592,0 +arc_challenge,acc_norm,0.3191126279863481,0.013621696119173304,0 +arc_easy,acc,0.6292087542087542,0.009911292822056923,0 +arc_easy,acc_norm,0.617003367003367,0.009974920384536482,0 +boolq,acc,0.6305810397553517,0.008441557531799614,1 +cb,acc,0.48214285714285715,0.0673769750864465,1 +cb,f1,0.3338164251207729,,1 +copa,acc,0.79,0.040936018074033256,0 +hellaswag,acc,0.4766978689504083,0.004984359669951929,0 +hellaswag,acc_norm,0.6308504282015535,0.004815882719278398,0 +piqa,acc,0.7611534276387377,0.009948120385337494,0 +piqa,acc_norm,0.7665941240478781,0.009869247889520993,0 +rte,acc,0.5054151624548736,0.030094698123239966,0 +sciq,acc,0.902,0.009406619184621252,0 +sciq,acc_norm,0.885,0.01009340759490462,0 +storycloze_2016,acc,0.7252805986103688,0.010322309878339504,0 +winogrande,acc,0.5832675611681136,0.013856250072796318,0 diff --git a/4b284b84bc4seed1/evaluation/rankeval/4b284b84bc4seed1_2.json b/4b284b84bc4seed1/evaluation/rankeval/4b284b84bc4seed1_2.json new file mode 100644 index 0000000000000000000000000000000000000000..37a754bad192d837abdfecf6c7ac83086bf29225 --- /dev/null +++ b/4b284b84bc4seed1/evaluation/rankeval/4b284b84bc4seed1_2.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.309, + "acc_stderr": 0.014619600977206493 + }, + "anli_r2": { + "acc": 0.325, + "acc_stderr": 0.014818724459095524 + }, + "anli_r3": { + "acc": 0.32916666666666666, + "acc_stderr": 0.013570806258433625 + }, + "cb": { + "acc": 0.48214285714285715, + "acc_stderr": 0.0673769750864465, + "f1": 0.3338164251207729 + }, + "copa": { + "acc": 0.79, + "acc_stderr": 0.040936018074033256 + }, + "hellaswag": { + "acc": 0.4766978689504083, + "acc_stderr": 0.004984359669951929, + "acc_norm": 0.6308504282015535, + "acc_norm_stderr": 0.004815882719278398 + }, + "rte": { + "acc": 0.5054151624548736, + "acc_stderr": 0.030094698123239966 + }, + "winogrande": { + "acc": 0.5832675611681136, + "acc_stderr": 0.013856250072796318 + }, + "storycloze_2016": { + "acc": 0.7252805986103688, + "acc_stderr": 0.010322309878339504 + }, + "boolq": { + "acc": 0.6305810397553517, + "acc_stderr": 0.008441557531799614 + }, + "arc_easy": { + "acc": 0.6292087542087542, + "acc_stderr": 0.009911292822056923, + "acc_norm": 0.617003367003367, + "acc_norm_stderr": 0.009974920384536482 + }, + "arc_challenge": { + "acc": 0.27986348122866894, + "acc_stderr": 0.01311904089772592, + "acc_norm": 0.3191126279863481, + "acc_norm_stderr": 0.013621696119173304 + }, + "sciq": { + "acc": 0.902, + "acc_stderr": 0.009406619184621252, + "acc_norm": 0.885, + "acc_norm_stderr": 0.01009340759490462 + }, + "piqa": { + "acc": 0.7611534276387377, + "acc_stderr": 0.009948120385337494, + "acc_norm": 0.7665941240478781, + "acc_norm_stderr": 0.009869247889520993 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed1/evaluation/rankeval/4b284b84bc4seed1_3.csv b/4b284b84bc4seed1/evaluation/rankeval/4b284b84bc4seed1_3.csv new file mode 100644 index 0000000000000000000000000000000000000000..569304c6e983172e1035c6817931158436fbb8fd --- /dev/null +++ b/4b284b84bc4seed1/evaluation/rankeval/4b284b84bc4seed1_3.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.304,0.014553205687950446,0 +anli_r2,acc,0.33,0.014876872027456727,0 +anli_r3,acc,0.33,0.013579531277800922,0 +arc_challenge,acc,0.2960750853242321,0.013340916085246268,0 +arc_challenge,acc_norm,0.3216723549488055,0.013650488084494164,0 +arc_easy,acc,0.6321548821548821,0.009894923464455191,0 +arc_easy,acc_norm,0.6275252525252525,0.009920469215736012,0 +boolq,acc,0.6388379204892967,0.00840115419524237,1 +cb,acc,0.5178571428571429,0.06737697508644648,1 +cb,f1,0.34887334887334887,,1 +copa,acc,0.78,0.04163331998932262,0 +hellaswag,acc,0.4751045608444533,0.004983592410934173,0 +hellaswag,acc_norm,0.6331408086038638,0.0048096267236268486,0 +piqa,acc,0.7595212187159956,0.009971345364651073,0 +piqa,acc_norm,0.7676822633297062,0.009853201384168243,0 +rte,acc,0.5487364620938628,0.029953149241808943,0 +sciq,acc,0.911,0.009008893392651526,0 +sciq,acc_norm,0.903,0.009363689373248113,0 +storycloze_2016,acc,0.72367717797969,0.010340939873166822,0 +winogrande,acc,0.5943172849250198,0.013800206336014201,0 diff --git a/4b284b84bc4seed1/evaluation/rankeval/4b284b84bc4seed1_3.json b/4b284b84bc4seed1/evaluation/rankeval/4b284b84bc4seed1_3.json new file mode 100644 index 0000000000000000000000000000000000000000..e72c5a5e73f86abdff75d287084642e5b4190845 --- /dev/null +++ b/4b284b84bc4seed1/evaluation/rankeval/4b284b84bc4seed1_3.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.304, + "acc_stderr": 0.014553205687950446 + }, + "anli_r2": { + "acc": 0.33, + "acc_stderr": 0.014876872027456727 + }, + "anli_r3": { + "acc": 0.33, + "acc_stderr": 0.013579531277800922 + }, + "cb": { + "acc": 0.5178571428571429, + "acc_stderr": 0.06737697508644648, + "f1": 0.34887334887334887 + }, + "copa": { + "acc": 0.78, + "acc_stderr": 0.04163331998932262 + }, + "hellaswag": { + "acc": 0.4751045608444533, + "acc_stderr": 0.004983592410934173, + "acc_norm": 0.6331408086038638, + "acc_norm_stderr": 0.0048096267236268486 + }, + "rte": { + "acc": 0.5487364620938628, + "acc_stderr": 0.029953149241808943 + }, + "winogrande": { + "acc": 0.5943172849250198, + "acc_stderr": 0.013800206336014201 + }, + "storycloze_2016": { + "acc": 0.72367717797969, + "acc_stderr": 0.010340939873166822 + }, + "boolq": { + "acc": 0.6388379204892967, + "acc_stderr": 0.00840115419524237 + }, + "arc_easy": { + "acc": 0.6321548821548821, + "acc_stderr": 0.009894923464455191, + "acc_norm": 0.6275252525252525, + "acc_norm_stderr": 0.009920469215736012 + }, + "arc_challenge": { + "acc": 0.2960750853242321, + "acc_stderr": 0.013340916085246268, + "acc_norm": 0.3216723549488055, + "acc_norm_stderr": 0.013650488084494164 + }, + "sciq": { + "acc": 0.911, + "acc_stderr": 0.009008893392651526, + "acc_norm": 0.903, + "acc_norm_stderr": 0.009363689373248113 + }, + "piqa": { + "acc": 0.7595212187159956, + "acc_stderr": 0.009971345364651073, + "acc_norm": 0.7676822633297062, + "acc_norm_stderr": 0.009853201384168243 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed1/evaluation/rankeval/4b284b84bc4seed1_4.csv b/4b284b84bc4seed1/evaluation/rankeval/4b284b84bc4seed1_4.csv new file mode 100644 index 0000000000000000000000000000000000000000..31b19c74f9cc8b8549621376fe2f2c62d593ca0e --- /dev/null +++ b/4b284b84bc4seed1/evaluation/rankeval/4b284b84bc4seed1_4.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.312,0.014658474370509005,0 +anli_r2,acc,0.332,0.014899597242811485,0 +anli_r3,acc,0.3258333333333333,0.013535422043417464,0 +arc_challenge,acc,0.2935153583617747,0.013307250444941127,0 +arc_challenge,acc_norm,0.3148464163822526,0.01357265770308495,0 +arc_easy,acc,0.6346801346801347,0.009880576614806924,0 +arc_easy,acc_norm,0.6292087542087542,0.009911292822056918,0 +boolq,acc,0.637308868501529,0.008408838061823179,1 +cb,acc,0.4642857142857143,0.0672477765493766,1 +cb,f1,0.26842105263157895,,1 +copa,acc,0.79,0.040936018074033256,0 +hellaswag,acc,0.4759012148974308,0.004983982396187366,0 +hellaswag,acc_norm,0.6352320254929297,0.0048038126319949696,0 +piqa,acc,0.763873775843308,0.009908965890558211,0 +piqa,acc_norm,0.763873775843308,0.009908965890558218,0 +rte,acc,0.5415162454873647,0.029992535385373314,0 +sciq,acc,0.914,0.008870325962594766,0 +sciq,acc_norm,0.914,0.008870325962594766,0 +storycloze_2016,acc,0.7231427044361304,0.010347112890276924,0 +winogrande,acc,0.5974743488555643,0.01378286683170305,0 diff --git a/4b284b84bc4seed1/evaluation/rankeval/4b284b84bc4seed1_4.json b/4b284b84bc4seed1/evaluation/rankeval/4b284b84bc4seed1_4.json new file mode 100644 index 0000000000000000000000000000000000000000..054742e6c13d96191e0febfb3898599aa6e595a6 --- /dev/null +++ b/4b284b84bc4seed1/evaluation/rankeval/4b284b84bc4seed1_4.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.312, + "acc_stderr": 0.014658474370509005 + }, + "anli_r2": { + "acc": 0.332, + "acc_stderr": 0.014899597242811485 + }, + "anli_r3": { + "acc": 0.3258333333333333, + "acc_stderr": 0.013535422043417464 + }, + "cb": { + "acc": 0.4642857142857143, + "acc_stderr": 0.0672477765493766, + "f1": 0.26842105263157895 + }, + "copa": { + "acc": 0.79, + "acc_stderr": 0.040936018074033256 + }, + "hellaswag": { + "acc": 0.4759012148974308, + "acc_stderr": 0.004983982396187366, + "acc_norm": 0.6352320254929297, + "acc_norm_stderr": 0.0048038126319949696 + }, + "rte": { + "acc": 0.5415162454873647, + "acc_stderr": 0.029992535385373314 + }, + "winogrande": { + "acc": 0.5974743488555643, + "acc_stderr": 0.01378286683170305 + }, + "storycloze_2016": { + "acc": 0.7231427044361304, + "acc_stderr": 0.010347112890276924 + }, + "boolq": { + "acc": 0.637308868501529, + "acc_stderr": 0.008408838061823179 + }, + "arc_easy": { + "acc": 0.6346801346801347, + "acc_stderr": 0.009880576614806924, + "acc_norm": 0.6292087542087542, + "acc_norm_stderr": 0.009911292822056918 + }, + "arc_challenge": { + "acc": 0.2935153583617747, + "acc_stderr": 0.013307250444941127, + "acc_norm": 0.3148464163822526, + "acc_norm_stderr": 0.01357265770308495 + }, + "sciq": { + "acc": 0.914, + "acc_stderr": 0.008870325962594766, + "acc_norm": 0.914, + "acc_norm_stderr": 0.008870325962594766 + }, + "piqa": { + "acc": 0.763873775843308, + "acc_stderr": 0.009908965890558211, + "acc_norm": 0.763873775843308, + "acc_norm_stderr": 0.009908965890558218 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed1/evaluation/rankeval/4b284b84bc4seed1_5.csv b/4b284b84bc4seed1/evaluation/rankeval/4b284b84bc4seed1_5.csv new file mode 100644 index 0000000000000000000000000000000000000000..08a4774adec3a000c5e28ca18efeed426abc4556 --- /dev/null +++ b/4b284b84bc4seed1/evaluation/rankeval/4b284b84bc4seed1_5.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.316,0.014709193056057114,0 +anli_r2,acc,0.341,0.014998131348402704,0 +anli_r3,acc,0.3375,0.013655897185463657,0 +arc_challenge,acc,0.2960750853242321,0.013340916085246266,0 +arc_challenge,acc_norm,0.32081911262798635,0.013640943091946528,0 +arc_easy,acc,0.6342592592592593,0.00988298806941883,0 +arc_easy,acc_norm,0.6321548821548821,0.00989492346445519,0 +boolq,acc,0.6394495412844037,0.00839805483449795,1 +cb,acc,0.5178571428571429,0.06737697508644647,1 +cb,f1,0.3271557271557271,,1 +copa,acc,0.75,0.04351941398892446,0 +hellaswag,acc,0.47540330611431986,0.0049837401452186075,0 +hellaswag,acc_norm,0.6369249153555069,0.004799034356969407,0 +piqa,acc,0.7546245919477693,0.010039831320422396,0 +piqa,acc_norm,0.7616974972796517,0.009940334245876224,0 +rte,acc,0.555956678700361,0.029907396333795983,0 +sciq,acc,0.92,0.008583336977753655,0 +sciq,acc_norm,0.91,0.009054390204866442,0 +storycloze_2016,acc,0.7247461250668092,0.01032853840050057,0 +winogrande,acc,0.5832675611681136,0.01385625007279632,0 diff --git a/4b284b84bc4seed1/evaluation/rankeval/4b284b84bc4seed1_5.json b/4b284b84bc4seed1/evaluation/rankeval/4b284b84bc4seed1_5.json new file mode 100644 index 0000000000000000000000000000000000000000..72c292a753639c8ada230af18822657c8e5d772f --- /dev/null +++ b/4b284b84bc4seed1/evaluation/rankeval/4b284b84bc4seed1_5.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.316, + "acc_stderr": 0.014709193056057114 + }, + "anli_r2": { + "acc": 0.341, + "acc_stderr": 0.014998131348402704 + }, + "anli_r3": { + "acc": 0.3375, + "acc_stderr": 0.013655897185463657 + }, + "cb": { + "acc": 0.5178571428571429, + "acc_stderr": 0.06737697508644647, + "f1": 0.3271557271557271 + }, + "copa": { + "acc": 0.75, + "acc_stderr": 0.04351941398892446 + }, + "hellaswag": { + "acc": 0.47540330611431986, + "acc_stderr": 0.0049837401452186075, + "acc_norm": 0.6369249153555069, + "acc_norm_stderr": 0.004799034356969407 + }, + "rte": { + "acc": 0.555956678700361, + "acc_stderr": 0.029907396333795983 + }, + "winogrande": { + "acc": 0.5832675611681136, + "acc_stderr": 0.01385625007279632 + }, + "storycloze_2016": { + "acc": 0.7247461250668092, + "acc_stderr": 0.01032853840050057 + }, + "boolq": { + "acc": 0.6394495412844037, + "acc_stderr": 0.00839805483449795 + }, + "arc_easy": { + "acc": 0.6342592592592593, + "acc_stderr": 0.00988298806941883, + "acc_norm": 0.6321548821548821, + "acc_norm_stderr": 0.00989492346445519 + }, + "arc_challenge": { + "acc": 0.2960750853242321, + "acc_stderr": 0.013340916085246266, + "acc_norm": 0.32081911262798635, + "acc_norm_stderr": 0.013640943091946528 + }, + "sciq": { + "acc": 0.92, + "acc_stderr": 0.008583336977753655, + "acc_norm": 0.91, + "acc_norm_stderr": 0.009054390204866442 + }, + "piqa": { + "acc": 0.7546245919477693, + "acc_stderr": 0.010039831320422396, + "acc_norm": 0.7616974972796517, + "acc_norm_stderr": 0.009940334245876224 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc8b5597576739a680b2310234d29d05dbd656c9 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:348eace5e735ba014234171ddf32c879c0ee761e125a388c4472852e07107f56 +size 199058647 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ed9781c9e93d22174d25c57f9986f888201f4c5 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d97cefd39d4d46475300abbbb3afd3aedbc60e36d83d2e9d41e5cd2adf33468 +size 199058647 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a1709c6de2d96476f9c0fe06de8adb7798cf3f9 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0209dffffa22db82914e7a51d330b0e8da64b84e3f3fe94690f8a55fa7e1ebe4 +size 199058733 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e120081fb0f8fc80c92ace308105c19c2d89c5bd --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c3d6c41529f0aab6c7428d2b6cb81b4a5a5d04f97ef4c3a71c131e840963c55 +size 199058733 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c598c5ac6ee0613d4b63f1c39f6cade89d72f6c8 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d345768b4632ba0103167be2936efc6fb15f04f65ce6839b0cffce6a53e0b0db +size 199058797 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..01fa570799932f4be99e2db318a478987e1d1076 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9842f80fe046b3a55752938dd654e10b90c56b3a23aa105018636594446f8681 +size 199058797 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..08a417a2303985b185b8ea15c5d83bcfd7d33e0b --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:763161d20e34ba333a8d3ff89d13670e5d61e26de62e715d7668803dd4e951b4 +size 199058733 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..29c5e9b7178756f755faf15bc3e3643c8cafe148 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e67de47ce9ae80a562734353712e5a9c7fed7f339adf6561906e86474bd123f1 +size 199058733 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..03b4a012a7818ec68f69d1e76705d57befcde75d --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0bd9ba2afecc80d0f74b9b378ddd3c5b15f26538b703a2bb41b0041506d3488e +size 199058733 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e4ccb8a4fcdd59c0a0dd71421cd9672bdbb4ada --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2b807f43feee424d5599d49a7431d321411eacb730cefc4b31e64c4b3f7488e +size 199058733 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7a601088695a488e9a296408f3c0a3cdcd7852d4 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:801548d8d49af5d7f8d6264f2aac8a34957d56b315bf726ad6b187b89d413c35 +size 199058797 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8d3b6a443c44ce5c8b5a929f7f74b842ba3742bd --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f33294fc68d9785a98e32af0278f8fa9d65dc4b10d29e661f96e658cc288ae5 +size 199058797 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..69b1c391a215cca0dec7a13300b1b11174dc6201 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47f57c39dc48dffdf917c7211d5d21c90d54983e5a43dae51dc32ba1c50e9f7d +size 199058733 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..161ad1da312e1d7b2b0f00e7d1b1ae181f829ecc --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab345fd2351c21afcd3edd1c816d2c336638ac3622143f0a57f41095ef3c0de7 +size 199058733 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..22ab093f43d16466e337bb3db843578e13f7a208 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d595425f984200fe18627dd79cdc1235a3a722b96fecd533f164ce16fef442c9 +size 199058669 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6173173eff038b4b3a7bc0aff6078f7277672e07 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8fbc33cb46aa517aad18be11461aa6ee806588ec6ba830400378ba5514433f22 +size 199058669 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..04b7d3190c8dcc5be65ccd832ca8d478e22d59fe --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb93437c2450274c20cc3939cbffa7d44384e0e2a3f14b7dcf4db3e344ea64ac +size 199058797 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..230760420fd4c552db554ad7f55a459127bfe407 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7fffc2117be940493faac269f6bca07f5c16820ce9c844dd41d1b30bd41b3db3 +size 199058797 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ceb7b5ec7d1f7efc68b856051718c9f1d872fa16 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:408e28a3758d0cae64f70fc0ef4934541693a9f83aca452f6a9b869dc70e0773 +size 199058733 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..857e89f94baffcbc4751dc8a3cc842c2ae603f16 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59af72b805d83c7d0028694cd4ae2bf6d53ed30037d04605669a433d636f64d8 +size 199058733 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..64fa7731c8816fd0fb42bd2b82b02c6150b9e305 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af91af2ec00feaef9a059b8a96a145dd2edc213e19ff6a381f0b0731ea3323ca +size 199058733 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4064a9db9c7703f9c681b0087cdb866c1f4679ac --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74d7beeafc6f9b8475eae907dd4703e9b807b1a9f375e0dc6e3f3b53d19b08fd +size 199058733 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4b124f62308e0db527be316c2f9e4be3ee0f6881 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8cb2bb079ef0cefa6aa6cc8ae3ca1551a55a826f38f83e7cdd967bd200585b34 +size 199058658 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f834e0aebfb879f9681d8a55d5dbf754472c3a59 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b717f947848a392f71591174f1a1d733771649d55deb16e36ce4285a059f2453 +size 199058658 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6eb83bfe204a84c20672da958490d5bc7d60ac95 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1de0b41ed9e5523c532627f7690adf76576d7eeb65ec5bc96b37b5eed81cdef7 +size 199058733 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3141ce1eecac96648400301ad5a63c4da00cabf7 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a23efad123136d996aa6f12f52f242956f1c388752ace2f276cc9161176f4edc +size 199058733 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1332800bb862ee7e3bfd3d2a1697db5ed78d2332 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:268b7803ee3926669ac80f425bb0ef8e9197e4734912e7ab02a8c870db36d443 +size 199058797 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3259b82cf4bd5918a354316460b736867a48697 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48c1d52147eca938231c917a7aa994cfba2a63cc6f231f7d725f79d5c9a22e4a +size 199058797 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c9d0293fd407ec62c0af907ae7492be7b70a6a8d --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:608a9ecf3154d82aede9a4d7793412314169ec911e70d0dcdce96986f9d372de +size 199058605 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4fda23b2fe56852f1bb13f9eb8fc736d8f0b2667 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd0511329165c3ab2e007b494234ca59c16ea125c13546a13c9c625064614301 +size 199058605 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f0ba24b5440922b185e1ac2f2d84fbabcab3e1e5 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9cb2b9f16050411633dfbaea8a864bfe61a04b7e656bf19b83ffe4d12c38fc71 +size 199058669 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..669ecb0ee3a422b8dbd0d2736a460f753b871883 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:482eff3687742518d21d3640b4e515a4f21032e7fbcd5e289cd138fb0ae3eec3 +size 199058669 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d4f80d2ba4050eec2f8e5010365850fea1c135ba --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8418b00475b808ea3a36e0d03272d5787141891d3ef1d55ba4c0fe5f4581684 +size 199058797 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..12365855e2e5291ca8fa0b7a08e8f355c389abbf --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:79cb72c3f1a8f8550bccead4f6a416ef8b722884edac14597e6a39f590566b9e +size 199058797 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6278729e6690cb0c4a36a8bd88081a48b7931257 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d51e0c914772ec98362c25810ed6a531cb11ee52dd4bc8e00046dc57861fb9a +size 199058733 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..570e21bb1a024be8361fc1fdd31fab8531480e5c --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1b9c1b49f82001f615ec004bc1513cb9810ab709f80c304fa4f63b1d881809b +size 199058733 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..22ece4fe6be56a11ccbf2c0e28cb5faa61ae747a --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fbc2d0f2c2de78fbb2238e90471d316829db867fcf355c6bb6318f4080bd3218 +size 199058733 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e81403094b1bc27b3831cf2bf4a3dd9c3b2ec172 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:893abdf7c5e26f4731c6288c527d5d5f0a81256135f5043fe86a566a7602687d +size 199058733 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..85e6cdfe42ea633ea4395d7b5bcbf0bf9b524412 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:898b7c418112c05cbee4bc0c93ab9781356e62511f14dfc2a3500372c589af8a +size 199058733 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..17bdca982b51cc1185be212d76a63767d229829a --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d44b8200526792e7f84df68acb4d9ecefce35ac7ebcc863875c0ade139ab5d96 +size 199058733 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc494c017295c57bce06b549b9226ec7ca34fa35 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80fbafdd36afec846f1cf0c3d9c649122476d442b65f4e9872a0f0fd76b9821c +size 199058797 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f71e70f8206b0af6bcff38fb4c334484e9baf00b --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:353e777dc52d8217d4f632057649e59ef279160606f9a77a76f46de38f08153f +size 199058797 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d7d880e30ec9e63f1f86dc7683ff52af51244fcc --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46da35b5edd98cdcce6acb900cd87656d171c6c375f744c84a31d6d4f25b20b6 +size 199058669 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ddf2b3bc72fe439f0fa16cda2dd5f0c57638899 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ee1828fcd30a8b70371c4005608756a52a356b35d92308f8b688068a7caa952 +size 199058669 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea826bdbbd6dbf4c144871f563fe9bb80982ed54 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9ba3a267bc27b1560eb88eb86714454983d143fb4b15fe472f8b477f35f364e +size 199058850 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bdac3e09c54cd36717cfd4026de419d4bf2d0980 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f423c2da4efa7185220d5ca416d6ae59e6d0478d2fe6bc033c409d481abeba29 +size 199058850 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ad66d5cb65df7859b43e84ea66306995bf58fdd --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:79bde02486cc076b9f75f1fde3b6c4dfe74929c7de298c1cba91f1f9a4804307 +size 199058669 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..03b242697030607d08fd09ae91a679aa81f19e2d --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:829b1de1a4f6be9d340cf11596ad164887e8c8aea2288231e71eaffa08dade06 +size 199058669 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3c60a698d57721e6d26ecf612535b09a23c3f4e9 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1610496ec921cb26adea1a4f8fc69133d5c9a1c4e8113a8349ccc10f550bce84 +size 199058797 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..63074be3e7d9084654e6db542d6f207f638b46c8 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7dab5eadbeee1e481703f500206442d9aeeb93fce41aad459da0e7f475a10278 +size 199058797 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a970507498acea4cfb3b74e6250a1e54c43c49b5 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5bc8ca3b36e341c0c266c3207f364d06c45275383016dd0560b886a3e2c1aa02 +size 199058733 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b93d2754cbb76d2466ba09a71373a93c754d6c53 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74f31382003249b0eec168b920f0bdce29698f7de2601a0e6660cec5ae117aba +size 199058733 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d2a72c2cff73b4c2594dca819f22073711b2aca8 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5dd8a3ed944ff97581585aead42e30d58de5626f8ac395feb633aa978f396466 +size 199058733 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ebf1961cd62e0eff5e4aa65490876ca1dcd8bb7 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21b438867b60e75b82fff07311c8d30c106f4c62c27bbb7c092147851bac750a +size 199058733 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..76ab635ff0b3bae8b27bebc875c53f18d05fde52 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3ed34620d339f49dcff626cda791538d3f1c5b64b16f0c7f0c00b8d1e4b9680 +size 199058669 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8765eb9cca27c6ddaac83a9667197038103fe152 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:197f009680507c86e7da4d344b7e1b9bf0d4bbbcf0ba7e696e737ae36b91bb7d +size 199058669 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf30807ba388342f1e9401448b608c75a7832997 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec787dec9511ca096f4ccb4b6a630f1cc88b4a1a304c891864373c7ba760bb70 +size 199058925 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..901e58316b7b059acf281d061dca46cd0acf2dbc --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db8daf852d4123db7f0d370db8f37cdf9446f714d1e2f243a4474bbc426b2785 +size 199058925 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e9c9afcfe963bde6a6551f42c43c113b6210716c --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43e36029b7404008d95947920c415eb58bd420d507b9580a075b27627a0cd6a4 +size 199058605 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..05158488dfbb70ff0b72e81b9ef70f933bfc1327 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3232297e1522a8770c28e998f7617fc56e2a3eb436a33641c79e38dd2e04ee8b +size 199058605 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a3855af17d474b3663181291c0c998de0f2587d --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1ac2d085814c2725d29bfae1102047fd5b39805810a56da8971ad00dd75adc7 +size 199058605 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d69c264661369b720345f8b4a76f1881bcd1f1c --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5577c769df742cc928038a74a276417ab3c40517f97fbb3884c5391ea9cbf41e +size 199058605 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..926661e9264536a545e7c15c497323179545d1ba --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9bfab271b8dcbf51ef37adc041bba3cda4799f8e1d408d46acf75c25fc5d787 +size 199058722 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..30d27249eb1499381524482d9c1d113fb3e99328 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ac090832b196d1b599f27ee10cac936af98c86c680ffe148c653a93e92b38b9 +size 199058722 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea49aec546e6d33ea276bae56c0180d83e28dc74 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:188042558c0571ba6c1b530cd6b684dfb14893506eed0ae6fbf6ee53d93c67e9 +size 199058658 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed9cfec5a49879b9dab40ab71303f1a7c039bc07 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea73837f40ef513177baec44675b273aec30f55496685472fdcafab12ce0e6c8 +size 199058658 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6887b3f5e182798dc5bd8f20d513f8b148c695f5 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0200935e247ce4a5e4e296a44b4559fc742aa71e45fa8a20c1d994cc8ee7a07f +size 199058722 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..da4ce3af79bde9d7ad9ff404b2fdcfd837b4745a --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:657be3a0c9795204f7534c107695c011563def819ac1ccb8acb424d92053245d +size 199058722 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c85798104ef27515cdb3deef874e755f741c3dd8 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b9d1f2069dec740b24010f9f1149c6edf13072d1892bf2846964ff82d54bdb2 +size 199058658 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8824a626b57dc9c51c5c1528e8fe9b661daeaffd --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00e705430b57de366562634e210c7d57aee7116cfacdd7fb1b358525e6e4fefb +size 199058658 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c0b028fa77fde4e9fd6269148ec9142d613f969 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30b47f1b901b702cfb12d68fa6dad40dd38f021a3ad52af50feb4a04e71ba90b +size 199058786 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..46636810ec47d4758987c324e1f308f9909dd28a --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70e1aed37c1ed857fc6d39d257188fde1c685b36da93bcf565dc9ce518950b17 +size 199058786 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf988d36a8bc8745902c14fa8a09fa330b9fcc78 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77d7ce58a46558a6f1107ce9e0be5f25ed915e00fc240c782f85ee24a91f66ec +size 199058658 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d1c890699929aa11b8b21f75607a56bf7ab7e47 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a16e305c760a19bc0474db4eb3febfbf240839f4434c887efe51858d3b3097e1 +size 199058658 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..918270b241e5d540408bfa33f073a77ba9654d2e --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0996567a8e0761a6fbfed81f88c2fb3dae2f4f58a630bd9b4437ef6de8e9d4d +size 199058978 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d40a245e903a2063b052e1d0a4b2f950175da847 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0791303f66b1329ceb98ff79f9a25330e070279736ab1f2c0dca0823fee65b49 +size 199058978 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f85c3a566758bc084a102de2dc0498ac715515b --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa6813b2f28edb4798785e3b73b58e709e151582214dd1dba9bb742483748383 +size 199058658 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4024d76551d0b4968079dd438df6f4d5e8dca6d3 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a62ae1004d9e16070d5759682e69e3c7fba9e9fb1f122f128534fd55c272329c +size 199058658 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bc1e16402cc68a1e52c319a30adfcb12228505da --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f4f650d3a0bdb0b27ec0762673d4fd1d41af96db72ea0d1d0d5bcdbd524ed64 +size 199058647 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..145001d6fa2796b66a4d206d371380d5768b9db5 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1e8d60ffe595068f5fc78726427a75ad5b5a1fae01a2aea6c678abb957fc9f3 +size 199058647 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..df8384065f523b9e94e41fee8d35048cae3422b3 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa34a877a0ed3b649f7f16b835c77a47a8a1ec487156c014444bdde97db1130d +size 199058658 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..be01dbe87f5718b433d50997aa58211ed460b2d7 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0aacc96ec1908e1b665c775e77ddf788bbdab42aee3a60ebc56e0a7dadd85706 +size 199058658 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9217fb37cda45ee99be82bdc4a73f243b846a3f3 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2de3b491aada05a734ea109fc164bbf726738b915c3f0407126c1d32d109d78 +size 199058722 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e15dcdc9df0343e3609599a9c7ede5cd3953b064 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc1a52e3767a8f748e64ba3a5b39706cee217c98d4d40cb9ff10064859d5e561 +size 199058722 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4264046552be53e2372245ab02adf78b9e5516d2 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad4ea29cd2f8ebe89b049984d5daf0b971ba2870deb5063b6133ccc8633be683 +size 199058658 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..edbfcd9d558699336d842b42a5ceb61e29b10071 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d27d38b3d9e234214719975b86c333307cbfe844d60dcc757afd4a7bfb708751 +size 199058658 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e74c3df0e715deec1a3527a30e3e59c7f97cd7a0 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e5fdcd13ea720aaef59a75763808bafbc09cb9092df071c25f6f0222d9b76d7 +size 199058786 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8feafeb7aa0875b38d6263a3d5cde47a40c8c808 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:707569f2dee5e40c4e45ce53b740e70a636576329fb72019fc2004a423f1a0f4 +size 199058786 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c502fab6860f9dfee3cc14cfd96c2cc886d9e85 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f70f44fa6447c93586d0fd02d4ed67d30e2147f34cc5f3eec645092448dad7d5 +size 199058722 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd047ed01fb642850b45332a5fb7eb8bca369746 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dffa1a3225c54715826892216ee9e4ff0772a748b3550cdbd2182e10ae6aa694 +size 199058722 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cba830f6f3477fb2d9fdc8f223ca4ac845448491 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8565fc237b8d5b1704f5a3a2f23c2feea2c4aa69b1c564d6568bee931ad430be +size 199058850 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..decf013d0d5b35c0ef7b93d87d6de6ca7fdeda45 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06a629cdd6083f4f6d328ba8193e40e0de28c30c0a09eae603cc31a262d55323 +size 199058850 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae6479bf70a5b695c56bc567f0c1c612597ed80e --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7e8535ba603332a7a9dea73e058ba66e065532f36028c79f8319b773def9224 +size 199058722 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c309a3bc348b82ecf61359588c3c29d89bb1362e --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9c254458e04e05de272854f8c57e883dd35857dcf823e7cdab3c2c7bffbbd7e +size 199058722 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..80c81a09ccfb211eadbbfade6dcac61fd8613976 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b14c173d5aab9d6fb61eced7bc858c851ffeeda2d1f9a34a9e3b9bfb181f9998 +size 199058722 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b81335add643b8d369159e992914adffc2e71e54 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0f2e4c9fddc018b99d6ff92c67847f3608ef74b3b71d5c7a48b58c124be6bd8 +size 199058722 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9ac6bb30ba46c95172fe0c3cc22fdc9cf93203af --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76e4c2081c9a8ee9e50ba03029fb35e872dba79a394aa8d5bacdfb5152facb6d +size 199058594 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..09e7ceb20a2f54fa2cb1a0fa7d1ac512a08ebf3f --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:794644cc4a1bfa3ef3d84ceda88134f2fc993f323939ac6b05a5598d758b8552 +size 199058594 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6aadb642e4af4ec89c5e69cd89fe9de309bbfc4f --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f9f626432fef6e5c3563589fdacc48c5d1ce28ed3f8ac5bc267b885aed01e50 +size 199058786 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a301889e03262c384261553cade7dce885fd47c7 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0b994b6b350b341eabc11402cb21b4fde7501d2da33c7f0a1a3b915001b981a +size 199058786 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..124ef723d522be32da06abb746b6893b3d0f7ddd --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a84a47e08c2184eeca43dc41fde85b6aed70f143fb88cdd0fd9a48c6f68c26d7 +size 199058711 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6e6b5903f933c544efe31fb983580c9562c770b9 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98cd448e2032c44bf42ee8d3eb31bc48feda540fa80c8cf469bf8cf72eab367c +size 199058711 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f94434b99b7e4eb6ef6bb25773b413d7571a6f39 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da9583716b72a36a27f64d14d87cfed660c1299482d51a75efcde66085d3987d +size 199058722 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd384b0baab3ea891914f41e287a0ae1e95ef721 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4fd9236fc04c4bdd2154235160cbbceb7cb203e0f81f9c2c1353e124e657ef91 +size 199058722 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..07ceb14f47be53c89b19895bbe2a7b08381c5814 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d15fd193d1211a48e6a5f4dd09ebd9482423886f752ff3ffab4e89111a754ea +size 199058722 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..163f146f64826bc179bbfbc3b4882aa09d53bd57 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a74e0f5be4b45e00f19a0fa62b7271a801ce8e046829b60dde5da5655528ef4 +size 199058722 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a778d0f424c0cd371d77069f823c1dbfd745586 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7720af442d5b3e2367e9f19ebe9bab05fcb7d46756a9f0d10ac240329b979b91 +size 199058722 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a3fd8a5f1ef6450500d2017f96e075888e16eb2f --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccb66b57519988acb6148353d4bf2ab5a258f622feb197ebe3ccf3452c81a020 +size 199058722 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9ca8b7d809580599a0b1cd4e42fb2ee128b8cc05 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f8ba710baff9760e1f71a81273a8a5f87bfa1e47fe3c37244ad1c9bdb2b44e5 +size 199058722 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a76c1b778a05d08074da15a5c00f9520ea38545 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c52af1744ef6fd35b7621de35c14afb4c9eb0f3245336f09aa5d4c0261de885 +size 199058722 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a4169b6edb10a7fbdcd0bb506e48f02aa6a94f6e --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08110e3e903e069aeca7b3e97dfa7bf4d362e3682d4df908e21c7681625d3d36 +size 199058722 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..389b428b8e8f81123580c803c02cd111b29617e4 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99ecfa95ed9d1c4951eb0e02f734e3b7f9c81c1fd3ad3166d45b9b46b4959655 +size 199058722 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c13eae22924ddc1d15acd50ce76e3ef52b5767a8 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3550ad3c789573d791ed54689407d9e6d9931823a5b7c603c7e52a109bef1c7e +size 199058594 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..534f9e2f3efac005fc478d1788bcf760ed1abc84 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5846eca483294d9a5fa91a01aa073826c185016f07dc6bfdbd7ab76b686e077 +size 199058594 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..37541858d6de3e75d6c5cc881eb5e32dc3d07b92 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:618ab27c66df7478be2db893663efe82140b9c15cce9e1578603fd051149eff3 +size 199058722 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b73bda3ac25082351a13aaaf968eafed49c61629 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6776d08c87b696f5f68597daa2e99ced85bb62ccf4aefb1419fed81039a4a6e5 +size 199058722 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd20efb15da4ce2820c7f267a79f36e4b1d62529 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebea8e45fe98a1afed1ba688a2f1fdeba374ba39d1d443f1211d16a8400de597 +size 199058786 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f5d50d525209a09a24618ada2b7001910182d1d3 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c371c77b5919d447a11ce33afb82f919fa244ee1acd09a4e2044626541304263 +size 199058786 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..763c5bd35fcda326c0f64abf0bf69fb267c25800 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d09ee79bfa6b19aa05e718a14567d1937a634c26b7bef1201a158a441cddd67 +size 199058850 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0e1383030994098de694e82cc6d3fd564397c3a --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b60571623459aaca95bf298605d0cbbd75d6959ab174da7fe80e006ea7a141ac +size 199058850 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..585303f54a2907de875fbc2af380dd32a133f1ed --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d1bf510ca659bab19be7986e801fcf794de04bfbf4079c606bc4b924f62976f +size 199058658 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b3ecc1b7bfdced26dd103680abfa22b88239122f --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ba6aa4c337cfa76f68669188f0d5f41a2e740998aa1d02d13f39c13f73f9471 +size 199058658 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c815d04732ef3a65dea590d33ad5fbff3e55b17 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:942d1efaa446a3aa0c058f000421076effa20e99625560e62bb68087dab7826c +size 199058647 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b315aaac235252678f937e96e085941e58af090 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d44e37bc6f845ef20411b3484ebe9820ea8cd5bae4aa7153f9d5d496fc7f4e6 +size 199058647 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..22019028b1cd260d1fa9ce7d44ddf159414b14ad --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2055265dfdde78a97d94b17a9963b4ffc3eeacd0270f6304684173b31478be72 +size 199058722 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d86bb964465a92249c9ab0653ff21a67307dd866 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:957e91ac204bef374f3651559421beab1876b69fae52a22301905a0126ea365a +size 199058722 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..916dac00e21bc03dc81525941fb51114f5de5989 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b77305176d643142f4db84df2e5026482fa45f901109e56d7242c7f5525e9a18 +size 199058658 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5109a6e6ef53717d1c7ba6dab2af96a9498e040b --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4cefa09bf2fcd02317938c28a6807d617b1c328b702c3c19e0ff66015b309b16 +size 199058658 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d312d93817f1b3bec26b670d78b85f33ef87520 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62d6c0b006348aa82b71e611ac3e2b7276574ea802fa8168bf22fcd1d4532824 +size 199058658 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..da151ceb7a4904c48c1604b16b0ed1c0b82e03a4 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e694cc827850b1c71c1c8e493545577ee7da4df76d0c23ca1d08b76887fed3b +size 199058658 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..101806af12cd94cf66c32e58f83525829740f12d --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:071925f295aa9606374bc65d76b382c8776b1b05d7006c778b889ecfeaf6f3e7 +size 199058722 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f184e10c1bdf9d073335ae2995364a412774e60 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa663e701690bffe1af28c3ed600095d0d993c3aea741d794e99187a27c5e5fc +size 199058722 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..781fda1b2541f1a771568bba9d378d1cd843d98d --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1dba835e1d85d569beb4bc0437e4dbb34941a5af5e32961add9fcbd8b178c65c +size 199058850 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..22adcc2554a7626147d9fe73b366faf1dc130fae --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cdb8f6727fe6a886dbb5834ae99ca3b46c940601f5966dd004ab9a24a26654c1 +size 199058850 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3c539593b45127a0ea47f03ad8b8224ab308eeed --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3dc5350eaefd3ba824a71613f448a2db3fa86ea51f9bfbd97326abe851964c7 +size 199058722 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae23e7eab007555d1e460e0aef3276b6ce01264a --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:314d28aba3073f0bb85ea75f9c11163a1d1b56c6390550e276428bbb5098f610 +size 199058722 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8004f116dddbae7355f6acd554ffe0c66d8134f0 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c3a0ae5dce699d4258a5a07a3060d27636ce352c8f8ab22f9e58fcb7558b13c +size 199058658 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..99f6a4794364a9766d0632147cb8aa089427f612 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:afaf529ab4801517c33db4e59c43bda1a684f7c0c66e38e7ce65e16e991f4a34 +size 199058658 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ad08adf8b83b0fbb6ff96af104176708eb774f0 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2aaeec010d5d1c0321a32e21ea3c29979b7316d4c420251c695ff08e3923047 +size 199058722 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..93c822698ed463e12110d8cd46068e113440c7ec --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2196cb5a40c1f2dd708d885b25f5e9999cf04db1aadfac9bb9ad8b1530b53c82 +size 199058722 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e9f449b57e6af02804a35debf7dd35efb8ee7cc3 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58ecca5fe828ab323aeb9480b3f6bb856bcce4b4c7a6139b05d577c372a9f592 +size 199058658 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..517d899ad98ba00b3ac43ddeb0ca370de0dc8bcc --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46d5c3ea731f4d96fa1c1c671b627922dfe5f09447327d060fcabebd5a4a2fad +size 199058658 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6375805f40310a5aa7e416b057cf7dbb558c64e0 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:531089ec14bfe18c4ddedd6d4d04318d772b81c3121926e29ea1eaf1faf80473 +size 199058658 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e2f1ad3e652a4edda8a8a6fbbaab53448b7bf1db --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b5a352d03cd8cef99f470509690047e4cd7016fb2d31cd7603f8f54990be37c +size 199058658 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..455b4d96c826e8ef00e7cb25dc6285e0ff847057 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccf58a2d0a4e7ec0bbc1efe5b6ac7e04b49304ed7ecd0b92e9135af244e589a5 +size 199058775 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..942073dcd6bafae538c43fe1db18253a19abe44b --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb19b55e1da8baedc2f9b1fbea15dec31bebf916a6353b98021877e37ff2ffcc +size 199058775 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..534a974202d94f2dc0a5ffcced01b0db57308dce --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc5bcb52a31c91e3ecdba8207f43be95861019a7cd04f98c86be2a8dde4069ae +size 199058722 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..98cb48e378604dfb62e524ba422f33d946f5bdce --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f1c31d6da1c267fd1151d1b136e06ac39ef78addf51815c758268f903fefc52 +size 199058722 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d5639f4311685ac690d77e3740e18aa7a9a7b90c --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9bdf639ef70ce909a55236c49b9b148cd9a11fb3150f04c3463ba99276e4449f +size 199058850 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..481845ebcd3bd01c6d1933cbc1a6de77778145ca --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7eb22b51d04fd0dd2d50bb4ca6863da035f84dc137949d2302fa9014c62ad1c +size 199058850 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f27afab24e39e2835c8bb0b2bdeb18f3bedeedd9 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebc33e251ac01f1636e465b092aa3870d21b296be6d8a3a9d3640b0b62180b7c +size 199058722 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4be59c2cff7ec46d5248fdde8bc4d612847ce94b --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c93d60fcd0c8a435f63325bf590178ad642bad3bb14e58ec0145c154a470aec +size 199058722 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f96f42173cfda9f66331b6c5f1ac03440cb66e8d --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa640f7363fe0fdb5e8bdbc6df21e9d45f6cc02ed7eba9470291c737fe60309b +size 199058722 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..89398867398f04c798d60f2e08b7cbe86155e789 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b004a967e30fa94568617677fe7c17b6233345ae325ef37ca32779d96e3e6856 +size 199058722 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..18fa26d55ed9d31aa0f811037367e562dd4f9072 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7bda1ad8309cf0ecf240929637eb18e293f4e05e117cb6b094e6249d59c0d7f +size 199058722 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..772bd1b6c536b3f809b13f7e2b65aa4d467f3740 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3dad94eefa71ea3baa1226c53d68b4dc2103b054eefffb6a7a3e60ed559fc12c +size 199058722 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5f23b7a6a5b96bed667c2fcddd7f6f4b3b39d7cb --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a3c3bcc9364d8345b5a5b752e299aed3f02f2ca23f0e59f26e1f7429f86e80e +size 199058658 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e3749e5a830f9cd2cf732a2c0c42906f169eca9 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f9e748aad46a57ff54d3cf2c6b7591cd28174a010be23f631e793bbcd148309 +size 199058658 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee4aea17d85c40cfc551f0a7d7c500e80ae099e3 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b351f511e915ab73ce96931592e9fd5396d950971c85b4887f372ae1ec20a967 +size 199058722 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3085dbd10d4caf6855044183b486bab40047608f --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37cb86b613c7fbb323cdf7871d935ef79232f2ef1015794b3c4e93abb0a13642 +size 199058722 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b0dcf0a3d50e1f6564a4c2e324bb407c4a6d1717 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f77757293a9c4c19908de082728a175187d1c1246d96944cfabd84ecf2b96ef8 +size 199058658 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6fbfa3a3bce59fe09c931bccd7b168d9c658a02 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:830f26edfd44d8bbae264d61637f74c78f27b860210b68cc98bfe68587f2c8e6 +size 199058658 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..31311f8f8999890e50b21c3e9cff2e002030166e --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8abf5b584f854e215446523c3dbd00d88584b74f9ddeb0d6e8c4d81e337e8ca +size 199058914 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f98b5895df84e697ff2e5cb61a5d30e780138ca --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b12328404c33d3b090f3d888201636853e292c24e87da5e998508b2f08a4787 +size 199058914 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ebf1db0fd99d6be51cac754b8c5ab623c11a9f9b --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7cfc7ac91c82410c41516071520698867125aa61071b82058fbc2fac2620f5ac +size 199058658 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a4c4496d7f615928637edc4ad1c15d5f9e58f6c --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37bcfa97d236dda63346ccb36e3276009f4a5191fab7e3c4a583d8ef8befef75 +size 199058658 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c898e94f3fa9ad680f9b203b6d16dcbba590255d --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f07d82eaa59999c33dc973ee06e29f3c0b49d80015cb4320e6dce1ecc681707c +size 199058711 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d7034073fa1b493e90db4a13eac9a051ce28fd51 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f294c31ecdadf0a14d9f80f20dfdb5e341ab95ac7f6708b1d548f2daf54cb8bf +size 199058711 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..236708cdcf7ac95037a78f2c2f403542e6db03cd --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0cae6229b732a946151914e671d6bfb4df2ae639c1b84f61d32422aa7c32ed62 +size 199058722 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9ba9fc4bddf761563bdaccfd004ef1e9a8c4aeed --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:500214a7ca46e2a64d693d3830ab40447b4a39e2f387dfc407e90198c040f463 +size 199058722 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc7705cbfa5aa124b1ed62de2460275c5fd3583b --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2ce26c5759b3fb78962937c365ae16769252ecdf8da4b0abc5d14e7934bf82c +size 199058722 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..85345f1af53e897038d0fd3943171c33b4172bd5 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49adde2762306adf28d476d9174c8296f97cba79eabcd0d8b4ad4d25518124d8 +size 199058722 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..20cf8064f75ad96a4f7103958e0ee2034e26a5cf --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a0b1cca8ebe1b6361cb7621838145a2810814d57cf91bae4fed6ca2f36997fe +size 199058722 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e55859f44917a5eac64b20bd91e101707f4e1c40 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c05312d90e6d5a3a419348c78c1e46ff01178e0d2f915ba71cfd9ae703661065 +size 199058722 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bca28b89b7c2b85bb979a69640f04c6e302bd5bf --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62cd92990b336c4d7140b1deffbf419ae12f75aabe391904c2cf6f5246908a24 +size 199058658 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd134e3ed76867084c5bd74eb498e78146caea77 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:257ab51e3c9cb5bcb6f243066a579483ef0c387979b78c40ae16e6b4d0c9e33f +size 199058658 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6802229518d22d000ddeaae037f9328b9c81da32 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:087f73e91c75768777955c712e7ace5463489ff19897ca6a73d2896f208ee579 +size 199058658 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d09271fceeaa28cb851410cdbf0270a8f403a45 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09c09ce09e61bb9bcf3c15f0d07178fc00052ff41940d4344992a8e612ee57d8 +size 199058658 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..283d0b66770d851a8ad73073ed60cefc795e9ced --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72f08dae5032fd85f730297b888f9ef0849e30baf8a09517a52f67c29784d3a9 +size 199058850 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4493dce733172d6a31efcf7976047454b9afb690 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e86951fa6acbefe38eabce71a58a7793574270c7465d95ce64591a25897b07c6 +size 199058850 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f1ba5c85beea7b19cd6ae413d92e6d3b04f28b0 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5541e431794210b5329abba042686b723dbae4e67f5f35e17af438112706e5e5 +size 199058722 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e4d5e85715cf15b3785bb6b2172b79853b5f1929 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3cca0ad710aafb2cae58893424cf7d142a52070325c5d83f91d83977bef2467 +size 199058722 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc886219dcae99ddcff985e1e2201ffa2793a621 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91e9bc73ed5b2c69b2512eb13b593a6438daee665e1ade8b648c40705583def6 +size 199058786 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8d358b69c7a8e4b92b5a4c43528c0888e4e5d258 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5fa8705e123ac1bcee8dec2ba607c5fb508fb925d1597a3e508b5139ed14803 +size 199058786 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d4abd7b6061c124d4d58c560134fdc373642bc57 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ae3ecddeaed326f7e961f34edb252697887059e247c163401416de4d9763698 +size 199058658 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f6d29409167dd2f6eabadd3627dabf17034904d0 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4005ee6183d0b7f663270786f34fc13e903ed12b681e2c5cc616a08e6f407ed +size 199058658 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca8d20f3789dea9005b7eed1a860d31201f790f3 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2952689cd2b975f997a99a28ea6a703d4b6ffa746ae675da4c8c57f2df6b822b +size 199058722 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..251cc10646d2e0f6befde1970545e592d7350757 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0e8325acc838de2d8706a9d85cd0bee20611c9d67e686661a881dac49bae485 +size 199058722 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..80953d0c6e1afed756a6dd3dbe0876849e928cbf --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8368bc6ed2ab41106be459dbd74c76bb531279e62f28641b57cd63e8cbd9dced +size 199058647 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf5d3609435fa1348ce927cc700fecd7c68b2737 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24f0850d1c5c0ad1c323f0a7fe3c7d485513e2e76a56e7e6e5f557acbf97cc30 +size 199058647 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5250a16d5c4c59d90ff933b540a923582fadf814 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9e0ca0522b4314a092b9f206b8e7244c2ffa6fa3e2c09af6efd95e1152cea87 +size 199058658 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..51ebe813b360360dcbb1bc10dd80ffcf2ec345fa --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e4c08d61b06b9f2be4d24ce7078c46295f2a8aa022d0fa68e3d64930457ee2b +size 199058658 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b04043957fa840e78f8484bcd45d1f91c30c9e0 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a92235c0dfa093949b35cbe95c9724eb0eded7c7ac251e7a9bb41ddcf05f041f +size 199058722 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb290c02d1ea79f415be4b98f24fb3f54c01ad1e --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2bb9aeddd6bbccb6e490fb724a4f1deff0da459ca5a784519d1a179d5c1f6bcf +size 199058722 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..75153024fd7027d229bb1edf7259e04da42f169f --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91ceca6e05eea6321190f6fcf4672eef8c69fc04258328b2043437998f3081a1 +size 199058786 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..04a46f8f6a2e2c33374124b94d7354ce7ba76f99 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3481b9db357387d85d1d99d7891981bea6f6154a3d390ba3e83a3df01d9517d +size 199058786 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7748cdabcb5d60bd127da270c8253167b17d5233 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99bd132ff17c0820111c83e31fe3cb16a210ebdceeba19e417f1a66c00d2b37d +size 199058722 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d2a8baedd9dcbddf011075aca364aa0c5113a9cd --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:266b92b0c9b6c43fdd27a0fd28c45293934c69e252136f3a489e383f777a7183 +size 199058722 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2794fe44b6e28a73f8cfff930d61f233a6eb4305 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c348ae98443313338888f85e4e1f572e32593ff237ed0e9fd56c636a4bdcd4f +size 199058786 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab0e924f6e197c3e8d3b3959979e3ba7f6be64e1 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1389167acff0e716e9e78c9f939df4b1d52a79368a1a70cb3ac9dc031612ff32 +size 199058786 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a234953b7f4e3eb913e3690d64e48d8970352146 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab8bb1f516e0e7d4157dfd213eb50afadcea8306b860bb4642c1ea1fd829d797 +size 199058658 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..786dd9a14dd6c51d3cf68149b3ffd895ea3284fc --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9666f7b8dcf4b06bbfdf02e3e644438bfeda1733b7dea8db8629a19532116e18 +size 199058658 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7e8dd5f28f1ed8fd941c0006463ffa9f411f3bf8 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3efd5d64d93744c188fd11904e47795e2cab8c689c6e443f99a0d995dec6099 +size 199058786 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..431a588636fdf69fc13d94e36fefe2d04dc7aee8 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7636440c3d574fc27b5b7661606dc82ee41f916de65a984486d0bf4ca44227e +size 199058786 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..903f0a7a422af9b1baa817828d86c565645ecf45 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e67567d110894565a24db38f6aee6a916d656533aa71afaccb9ebfd716ba7628 +size 199058658 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee8071e0f9a244d495987b054fef21f62a5ee4f1 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27ca4cc5e7e20aa71b59be0dbfc2acb0ef62562ae6b8f31876100b4fc98012c8 +size 199058658 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8659dda680b7e17eef72a1785cc5dc8fe5cacffa --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c03149ee3e35d76be014ac2780aec77785d99b1e829fbfc2f44365340a6bc257 +size 199058786 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..00edf759f2dfa6ff82b49156744aa20807978180 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21b1e903f4ac7a2c4651e2816c70379664e607732911f7153c36519b5c203bd1 +size 199058786 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce4729b23544078209e90ba182a5e1850131feef --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65f5486b46ff5349773b243412bb80d4c594a57fbd136d680aeb8611b68f2e4b +size 199058786 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..620436aab745e7e287e2ba8e52eb4d5c2429a6ef --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e05dfea6df0cbcea264ae5723a4ac92276d5ff03cfb55837d42b68a6e5eb66c +size 199058786 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a821b1e810bebd4ee79098d9a9c84d8451382f30 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:927337cb2f2b838d5d5490c0f59c0eecfd82c7d79ab3cd1c92e3dbff74e50652 +size 199058647 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a80eb9a7d534ae0515ade31a8b9b3dc94a0e5f59 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ce2170ed76f0641c4b1959e5d064f7909ad5dc24589630c9ab2942e2a002206 +size 199058647 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..55bcf5e10c0ac9ab0894c9c1ebb10f28de00713f --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ca4d4192c513653c594be9529d3a9e6f6140d4abebf34c1c618da37a39bf3ea +size 199058722 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6fbb250f5d045a5d6639245a1f909105a2846355 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1caa250ed3c8a9ac25471fb395c34287ad76dc1dc871fbed5bc7e5fcc0c3cfac +size 199058722 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4399bbba50def2fae0a8461553fb5c6c997f202c --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:373701416ad0aa64157424c2d0c09b10e1a17fef17aee4748b91ccc9c90db634 +size 199058722 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b469767388a58ab2497a6b5bbbeb02aabc18e604 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae01033b40ae76a4ae97d57ecd4bbdbf3ae08445e56a55fbff9cefc0aa51ca48 +size 199058722 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..22e203583d2142e40d4c3f35ac12f29d7cb99d3f --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d397ca5e01923c3640fe55a994c3e7cdfe5df1afa21d6dc97f8d6cec004a8af +size 199058658 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1797c17b2234aed415881204a499d7f619af00df --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22132bbc111a3a69ad720751e3d27e54fd3681a229f715945a7d5d02ab14f4f1 +size 199058658 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a774a1d61e1fa66b626b27b1319305170da2361 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a5c2e1e0e6882d61061590b90c6c8974e383c970351b2ab7e88c5276c3ae20d +size 199058786 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2776e46b748c012a523688e4bea59103b3743857 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:569cb0f2046062f05a959538ad379e260aeb636b106ec6c3b1060142d9941da5 +size 199058786 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8968bfcd29abb13d05ec5bf5312b33ce85cc6b3a --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9cacce61e870ad712da814f67b2f542b6752ec2c9563f3387021cabb3c09531 +size 199058658 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c9aed0fc895f23fba7cb0ee4952bd7cc09c00187 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6345621d4584971477d9a0672cc8f2d193eb2ab0b7a62456d521e404ce14b857 +size 199058658 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c941444d4fea8f94a5dd6537b9da76dd646de93e --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5d7a11017678cc388f289de30a06687dca28901cbb2d66af3b8a4e32f56e94b +size 199058786 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2cd17bcc19f5e57b0612061570b4a2182f0641a7 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04256578a1b2fdf4116e5ee738dbf24d7993fa4ae46273883a1aaca1848d0952 +size 199058786 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ebb9870efc0709729fce3a9e0dd1bbe88d967487 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7cbfe9c43da5e23e9511860695de16c6b9888d10ca85ed64a39620bc51a373c +size 199058786 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e1837a0afbd68b491f442aa2df9f8d9036d559f5 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4a0933b55ede503529bea69c28802b9664b88a3957bf34d1686abb32d622968 +size 199058786 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f0e2c479d5d0b2c042205eefae02c6ba5b789aa6 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3ca4e272618999da70305b84091ab7f631c07d25842ad37dfddb4c35482784d +size 199058722 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3681d324d6b20cc15c309ef0add814c1f1e8f869 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92fdf1ce38c6daee6dab68a90d570f10cb1f71b56f79998ccc0fee6d39308416 +size 199058722 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aba6e0d2613aac2d3dfa70ad49c51437214ad505 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e053517472ddd2337c4047eba37d1632998b2dfefe2fd2c2a968ec155dd04ed +size 199058658 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7b40426c9b4b8c83c58a2507d178cfb616eb6d12 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31b330b17975b8cd7fab55d9371d5dfa62794fafeda5d8ab778088e77d3c5645 +size 199058658 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed3a4e6da04db19122fd29d1b136129eea234624 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51ba23a7d5119442bbd8f8354e496382ac7c1e4b08a1c867e12a53b0a87b48ef +size 199058658 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ac526fab0a4dfaa951b7f165c76c3afb930caa3 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71a9646409d70ebced9ceff3f4baf080423ae836e385a7ada36c320fa4928e05 +size 199058658 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e105ff0d4340a681cd6e4cbff082503ca338876 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39e9779aa937d486765c5fd1acc1789a39de560b0c81921cbcee9805c79753da +size 199058647 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..45f11d39fec11e4aacb5073b4ec3a48310ae7e2c --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c60112a5250ecb7c05be0e78a4f5b3cc7353be639a83a8a2d84ba448deaa56b +size 199058647 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e406ce34d178f3a33f6997be8a67d6f6e6c7ce8 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ded0011cf178ee1f556572c7814beaf9492283298f876b792952ba63bf22d08 +size 199058850 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..560d58b1b27f0c7789076678675d0e7a2ac5179a --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a61808c1b407f6fa8db321ee1062cad5aede10dd8a0123edbb5df4f33b405e6 +size 199058850 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3cbd3cdb784a46f12cb778889c66e13c9c3eb828 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3bf545e6d46ceba3defc6be87895bcf97e9e6684f34397e89d43e7f77a0c1f8 +size 199058722 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b4b6b8a592b60e2510ecc28115e5b8c1a9b9598 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8564acac89a064583e42a280018b1aabb98bd26c6c04ee6784f2611c1b905dd5 +size 199058722 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..21b45dd92eb08e31b7b4ae67457227da01c37e0a --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84eea6ba0bbe1995d3d220696b23eb5df298cbdf3e658206e5b4fc3dca53dc49 +size 199058658 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..14a771d4ab94674db08101c31ee69da8bc782222 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36e8241fccc88feecdc0f0c0495a770e334cfa4da4ca27db46f62d0b74e5f1dc +size 199058658 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a405599c773450a79dc7f902f86b68bbb14415b8 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc0aedafc1c4a61f8d17e185fa4667de768d16cfec6f37d4e983d6610bcd6b16 +size 199058786 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..18e3cc3e34df7b96b4d28bb21a9e606fed12ad86 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0320e6cc0502a6b8c1c17d440bf2216b91c1f47f741127875f0361ed2f8334a7 +size 199058786 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a4100f82173fe6d77fbe47670cde35f7c410b4a2 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e33f77a6e22559f799108852a1bb3cacb1c280d8fe8aa83150153269bd46970 +size 199058722 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..77db596541d6df188e1cb549d3d9cd65ed2de0bf --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:386f9e0457f503f6ec0b6e3c1a53160bca10f60ebd2b9d34d3db21b1c906117d +size 199058722 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eac2699b6a8f70205ffad103ef761abe476e3689 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a153f106c17448fa9e4f95563ee4c5a14df84ef2494eebde5f3b33bd5f8cc63 +size 199058722 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb5280e52e34635b06a7e3c05a9605fa7f5026db --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32fe3152af323a6bfa55e0d6be2798eb3774d45a87afae9d69d8dfdda17435ed +size 199058722 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0179d8a2044bdcfd6b0066cf36ffaf0762dff2ad --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd84fbef8ba316fd24a8b349c2848fb9b7a73bb1f28903be0713e11d619e9e3a +size 199058722 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a3d890867e26ea890fdf0961bc4f0baa8cf5472c --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7423aa0c4a73ba222d1252c76a6576598a88afe546f95575084ab5a07956c019 +size 199058722 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..26e9d2c430f1ace5e776260ef8759b643cfb3da6 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb34da8b0726624361e970d0d99875a1f5b73d70e4d28dc0f96238ba863ff18d +size 199058786 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4cd0a37ccace1cc637e94ad21826903d37b71adc --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38f06f2a074eb8f54954a7917750c2431f08170f6f720a6cfcece95fb65c6791 +size 199058786 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4317c712b5b33785d00d25358039ca5a589efe8b --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1941cad59da9faedbfa07f03ad650ba0509ce137d6c966e331eb48076244771 +size 199058658 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d86bf319fceec590173e1aad3c9a1971e443838a --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b653f274ffe539502508beb2ce325ac68255820efb568a83d4b2f91fa4aff58 +size 199058658 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..64d2d843bd33db44e1cfaffd393052060f2c0e2c --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45ecc3aa8d9b18e327bfd5ef425941835d4fce550063689afb884dc0d1ec2d8e +size 199058658 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e4c0644214239fcb9409f9400151ce1dbdfe905 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51e1c1885e7bf848802269b1e6d6796987cc0f62d49dcf9397e837cefee53033 +size 199058658 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a0417fd9c3b9b7af9084d9b1ff16542568d42aa --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c66fc2d7e3c78feed85eb429ec92726e0613d1457070b5bfd11a910247de2e4 +size 199058839 diff --git a/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2332fc2f08bd13945ded659ec8c6ea948559e27b --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3e686821d8e18f9a39d5892bbb1539f67fdfcffd8e6590af143ff5708f568fc +size 199058839 diff --git a/4b284b84bc4seed1/global_step80108/layer_01-model_00-model_states.pt b/4b284b84bc4seed1/global_step80108/layer_01-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae5863dcc12d4c274066aad8d4aec5056d3b81f0 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/layer_01-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d14ebb2616a8534313683381e112cd7ac7e6e29c48e7001f49eea99740fdb077 +size 167511299 diff --git a/4b284b84bc4seed1/global_step80108/layer_01-model_01-model_states.pt b/4b284b84bc4seed1/global_step80108/layer_01-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..47b22b56ce6133a2a5fb60348b46f793740a1b89 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/layer_01-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6bc73b8445a58193470b11bc586bd227f57cf2f78bab781eca5d1ce553ac22c2 +size 167511299 diff --git a/4b284b84bc4seed1/global_step80108/layer_03-model_00-model_states.pt b/4b284b84bc4seed1/global_step80108/layer_03-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..39482903c485f9792959e0e0f083269f9ba488b2 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/layer_03-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7be6f0928faf9259b9a653cc4370f6771e04e86e07c906a15aeefe66c86fce35 +size 113308931 diff --git a/4b284b84bc4seed1/global_step80108/layer_03-model_01-model_states.pt b/4b284b84bc4seed1/global_step80108/layer_03-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c031ba1aa569cfe31e5b699a1347d94ae30cb38 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/layer_03-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f1baf1e86ab3fde7db14c386f7df19bf0e2f9f0e28e804e1d89cba2c251fa70 +size 113308931 diff --git a/4b284b84bc4seed1/global_step80108/layer_04-model_00-model_states.pt b/4b284b84bc4seed1/global_step80108/layer_04-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b6499d6d1b760d36a50ee10592ac1f4b63e6ca96 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/layer_04-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1051141f1d36000c2be1cacf955a040168d9979b0281cdd071763049c3d5a91 +size 113308931 diff --git a/4b284b84bc4seed1/global_step80108/layer_04-model_01-model_states.pt b/4b284b84bc4seed1/global_step80108/layer_04-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..681056585da9193abc52ddf7e812c42e9ebf027e --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/layer_04-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b17dfd0bcd82a7a21449f7ce183efbb6e849558b7f95777521ef670ad781efc +size 113308931 diff --git a/4b284b84bc4seed1/global_step80108/layer_05-model_00-model_states.pt b/4b284b84bc4seed1/global_step80108/layer_05-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..249bb3fc1a12b38f8070362d25505d5e11de2079 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/layer_05-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53a4cf59dd0094089a1fc5be82df0e4a903cd8ad56b52ee7809b865376640de4 +size 113308931 diff --git a/4b284b84bc4seed1/global_step80108/layer_05-model_01-model_states.pt b/4b284b84bc4seed1/global_step80108/layer_05-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4634beebc30c50494d9540f163593050c9b9f0ca --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/layer_05-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2779a458c2824a26fe4875a96aa6b5b61b532011459c2cd7bce741b61b0c0dd +size 113308931 diff --git a/4b284b84bc4seed1/global_step80108/layer_06-model_00-model_states.pt b/4b284b84bc4seed1/global_step80108/layer_06-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ff762091c9ca7d5054d60700844891895f3beede --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/layer_06-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a737325315e71203ef4f63b55374d2bcae29c04336a7b68c5a4e5867b7ca717f +size 113308931 diff --git a/4b284b84bc4seed1/global_step80108/layer_06-model_01-model_states.pt b/4b284b84bc4seed1/global_step80108/layer_06-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..26211a33c5b2fc9ac9cc5c080268c00a44f5fe1d --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/layer_06-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b344de261f4b3b5d500541f94ea3f7f9795248e67b046fba3db3a9b7c03229e7 +size 113308931 diff --git a/4b284b84bc4seed1/global_step80108/layer_07-model_00-model_states.pt b/4b284b84bc4seed1/global_step80108/layer_07-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c3405743255e978244572753ab70bc9bb250fc3e --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/layer_07-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6eacaefd308dcbf55dc4c17e015e6140271dcc51ea937e7160b3723c9b2175b7 +size 113308931 diff --git a/4b284b84bc4seed1/global_step80108/layer_07-model_01-model_states.pt b/4b284b84bc4seed1/global_step80108/layer_07-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..925de16b466367e4f794e9299e118a26e3ecf917 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/layer_07-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e048feb5a19589c81233602628d09a97b963e3412465ae87ca7ca1faab7f762 +size 113308931 diff --git a/4b284b84bc4seed1/global_step80108/layer_08-model_00-model_states.pt b/4b284b84bc4seed1/global_step80108/layer_08-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..994699f20665bade1e38ff3f42d70dfcbb8e2215 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/layer_08-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6681428ecfb6afd277d8d271b5dc8e5b8edabba321f53704b2c035e2e51fbc0d +size 113308931 diff --git a/4b284b84bc4seed1/global_step80108/layer_08-model_01-model_states.pt b/4b284b84bc4seed1/global_step80108/layer_08-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c1309d4395955cc8ff423d7abc0c7b428a5ad49 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/layer_08-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ac460d9a12eb1fbebf2178854ca64536f02e400c06da4d1a623c9ad54080962 +size 113308931 diff --git a/4b284b84bc4seed1/global_step80108/layer_09-model_00-model_states.pt b/4b284b84bc4seed1/global_step80108/layer_09-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e7bb32315d0d902ee776d7ecd3aa623e440ce9fd --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/layer_09-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c996c98537286ea8e73f7d34b26fbedff6926e356fffc63f21ee62764008ea23 +size 113308931 diff --git a/4b284b84bc4seed1/global_step80108/layer_09-model_01-model_states.pt b/4b284b84bc4seed1/global_step80108/layer_09-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0d4ce0d89a4d24ba3eb768523d98685cf8876914 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/layer_09-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:234c0ab0afc7b278dc86a7933db3decb74c4e147b36f96c1b42fe4d7f5911cda +size 113308931 diff --git a/4b284b84bc4seed1/global_step80108/layer_10-model_00-model_states.pt b/4b284b84bc4seed1/global_step80108/layer_10-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cab7f0a4fb2ed1a57e424eca36bf8891b80b519d --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/layer_10-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe9cf0a48c4327ab5d640548641a0db7772156c74a4ee55d224ff2215da96975 +size 113308931 diff --git a/4b284b84bc4seed1/global_step80108/layer_10-model_01-model_states.pt b/4b284b84bc4seed1/global_step80108/layer_10-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba5252cebcffa51b828a8550038d9a1802f0e708 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/layer_10-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd49992a07da248e0a806fb6696ee49b49dbdda68d49ab5efabc20246404f68a +size 113308931 diff --git a/4b284b84bc4seed1/global_step80108/layer_11-model_00-model_states.pt b/4b284b84bc4seed1/global_step80108/layer_11-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e828a4f93878af369ab8360e68492cb9feb4a566 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/layer_11-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:970e3dbe1135414e36fae4577791a4e51e1847eeb087458777f0f14913a90f93 +size 113308931 diff --git a/4b284b84bc4seed1/global_step80108/layer_11-model_01-model_states.pt b/4b284b84bc4seed1/global_step80108/layer_11-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7cbfd4ecd3654b0918fde32bc9c61819dd6cfb6a --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/layer_11-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d8fc7a499594336b7db7e9c297f88523a5239decea2bc21ca7b6a3447f5253e +size 113308931 diff --git a/4b284b84bc4seed1/global_step80108/layer_12-model_00-model_states.pt b/4b284b84bc4seed1/global_step80108/layer_12-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f0bba8a0549d3f2f52f53fa92f9eacb87c420c66 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/layer_12-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe8267326f6a43e802ad8ce1a02e0978e269f26599ca08e683b5771d0cef29c8 +size 113308931 diff --git a/4b284b84bc4seed1/global_step80108/layer_12-model_01-model_states.pt b/4b284b84bc4seed1/global_step80108/layer_12-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..78d6b64da7fa92e0f3344b01450864b9a1825f87 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/layer_12-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:518e403d3a829daf31a3e74855eeca6c890fc2a298e532c465f4004cd89f6f02 +size 113308931 diff --git a/4b284b84bc4seed1/global_step80108/layer_13-model_00-model_states.pt b/4b284b84bc4seed1/global_step80108/layer_13-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..beb43a2723ba247926caeaa1b65f0c8ab83b513b --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/layer_13-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7bc879a1f95b1825acec0277262e7e2cc44c6de0ab988e0a46dd1f006c2fba25 +size 113308931 diff --git a/4b284b84bc4seed1/global_step80108/layer_13-model_01-model_states.pt b/4b284b84bc4seed1/global_step80108/layer_13-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..44d0855f8649a4cc440e6887d047ea25ea6bfb7c --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/layer_13-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:972afd81698f80b3c26618c00f50751757af09884963d299e9fdbdfd8d28c2d5 +size 113308931 diff --git a/4b284b84bc4seed1/global_step80108/layer_14-model_00-model_states.pt b/4b284b84bc4seed1/global_step80108/layer_14-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f38b32be4336dbe9a485bf007e857c13f475a8c3 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/layer_14-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85e5a8d193fdfb6292837954a1562d0f63ac5fa6a4efd80bddd6486243cdf764 +size 113308931 diff --git a/4b284b84bc4seed1/global_step80108/layer_14-model_01-model_states.pt b/4b284b84bc4seed1/global_step80108/layer_14-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..95f79a268a9e379a19b71c1f4dcd1af8a825218e --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/layer_14-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1bd1fb3b80005b96ac9fc4795f74554c6946582398a35c76278b9b186a468b7d +size 113308931 diff --git a/4b284b84bc4seed1/global_step80108/layer_15-model_00-model_states.pt b/4b284b84bc4seed1/global_step80108/layer_15-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d22272347d6524ceb2871a466bffe5062c39adce --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/layer_15-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:531931374b5d28a313f1722727d9e5860994c8899f5108cbcafa755754153c7f +size 113308931 diff --git a/4b284b84bc4seed1/global_step80108/layer_15-model_01-model_states.pt b/4b284b84bc4seed1/global_step80108/layer_15-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd693ade07e837502a2d02f088ebabbf06b7555f --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/layer_15-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef2a295d9175715ec827c27d2102de867358ed082ed8436b985c920c30982285 +size 113308931 diff --git a/4b284b84bc4seed1/global_step80108/layer_16-model_00-model_states.pt b/4b284b84bc4seed1/global_step80108/layer_16-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..48deafbb045eff307afd5e9e916a48b764824305 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/layer_16-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff71f8af98d60998d469636fd5b5c106db3dc638e499c734c1d6cef2c69eab9b +size 113308931 diff --git a/4b284b84bc4seed1/global_step80108/layer_16-model_01-model_states.pt b/4b284b84bc4seed1/global_step80108/layer_16-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6da4cff63ef0201e51f733d531df79e0dc04e662 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/layer_16-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4aa471e6b341b20d254fcec8ae1016d9c09acbafa61ece091bdcf69973856a5d +size 113308931 diff --git a/4b284b84bc4seed1/global_step80108/layer_17-model_00-model_states.pt b/4b284b84bc4seed1/global_step80108/layer_17-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..00bca189fbdbc38415480c03c26b6206b070e4d4 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/layer_17-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48d9b151fef67c55411ddc9784048043b195379633791ff9a19964babcae163f +size 113308931 diff --git a/4b284b84bc4seed1/global_step80108/layer_17-model_01-model_states.pt b/4b284b84bc4seed1/global_step80108/layer_17-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e1f67ab1627f5db6c2cc2a887404cfba218b7815 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/layer_17-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d8444e238ccd3f79680bef915caaa5585c5871985b0274733afc39f0198bbaf +size 113308931 diff --git a/4b284b84bc4seed1/global_step80108/layer_18-model_00-model_states.pt b/4b284b84bc4seed1/global_step80108/layer_18-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..385e938d3a0609df7085c09c33b415f8be7404dc --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/layer_18-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03c05f253f107fa8acba1a870a9e59d53e7f5c7c6bd147d196aa7f48ee392f82 +size 113308931 diff --git a/4b284b84bc4seed1/global_step80108/layer_18-model_01-model_states.pt b/4b284b84bc4seed1/global_step80108/layer_18-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7e436c3fc62087b200e37f6d86532ad8c8b2ef55 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/layer_18-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1456f7ebd3cac3889c88eadd69ee8f067ce8c537118afc471f01b3004126c15 +size 113308931 diff --git a/4b284b84bc4seed1/global_step80108/layer_19-model_00-model_states.pt b/4b284b84bc4seed1/global_step80108/layer_19-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f484a24029081376264727830769d169281e458 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/layer_19-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b3cd7d6a0f8372d53e62efe60c556f83840aca0b8c15f06d63309fad7a27d09 +size 113308931 diff --git a/4b284b84bc4seed1/global_step80108/layer_19-model_01-model_states.pt b/4b284b84bc4seed1/global_step80108/layer_19-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..79441df6e06884b99a760af040975326b7dd0929 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/layer_19-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:496b963d8ecb54cffb850b01d2a630279ec59fcb70987583c46229e5ef15b74a +size 113308931 diff --git a/4b284b84bc4seed1/global_step80108/layer_20-model_00-model_states.pt b/4b284b84bc4seed1/global_step80108/layer_20-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8371bfe453aedff7a459c3dc90fb9bd36bc2d5b6 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/layer_20-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d41d2e5567c44acdccf8b9b79460502216dd43b1f277623f541651008d90e9b +size 113308931 diff --git a/4b284b84bc4seed1/global_step80108/layer_20-model_01-model_states.pt b/4b284b84bc4seed1/global_step80108/layer_20-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..34c8e7200b2d2add89552e02e92fee3438d9be5c --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/layer_20-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9389dff5fa16be030fa04e786944e76d37051b83d4b74b28c4f4313b6e6a547 +size 113308931 diff --git a/4b284b84bc4seed1/global_step80108/layer_21-model_00-model_states.pt b/4b284b84bc4seed1/global_step80108/layer_21-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..00acd8c65a0da36d9a7821cf05c7d795adccda56 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/layer_21-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:866b80b792d831b33ef3b31ff152243c0062867915709db8ac7a7c3cd13c626a +size 113308931 diff --git a/4b284b84bc4seed1/global_step80108/layer_21-model_01-model_states.pt b/4b284b84bc4seed1/global_step80108/layer_21-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..43f5afb73822defa40fb0af9380910d3e4588404 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/layer_21-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a336e4b0739e388dc989a52bd36659bc9fe506095e45e058a6d16b588a073d7 +size 113308931 diff --git a/4b284b84bc4seed1/global_step80108/layer_22-model_00-model_states.pt b/4b284b84bc4seed1/global_step80108/layer_22-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f0397e6391477dfe630ed06cb5415960ef33401 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/layer_22-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9faeb786175524368834fd4a3dc82e2895d4e57b6749f23864e3743906810f0a +size 113308931 diff --git a/4b284b84bc4seed1/global_step80108/layer_22-model_01-model_states.pt b/4b284b84bc4seed1/global_step80108/layer_22-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2dc800538e7eb94cfe7a45daa3be0c0c899b9a65 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/layer_22-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da145ad98ba6e2a5e8fe2a484c2bc7d0a42548527883657ebc2a0ce5d73b03cb +size 113308931 diff --git a/4b284b84bc4seed1/global_step80108/layer_23-model_00-model_states.pt b/4b284b84bc4seed1/global_step80108/layer_23-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e95ec6978511bb131d70073e104fe879f1d04925 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/layer_23-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6bfdddc0e79bfd3489c74296793e862a7d6aa5c451e2cc3b2152ae1482b0538a +size 113308931 diff --git a/4b284b84bc4seed1/global_step80108/layer_23-model_01-model_states.pt b/4b284b84bc4seed1/global_step80108/layer_23-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3807b56156d3fa6d9821904e7867d946894d6be --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/layer_23-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fceb8a6cba338333f29866246b270d1eb596065f1b590463db55c1b2ff705c6f +size 113308931 diff --git a/4b284b84bc4seed1/global_step80108/layer_24-model_00-model_states.pt b/4b284b84bc4seed1/global_step80108/layer_24-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9871038989fc155fbdd46753fd4b4118f7da7f09 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/layer_24-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51e282109f387c19ecf91b373cd464d33822770b8fa1051958748489c4b19268 +size 113308931 diff --git a/4b284b84bc4seed1/global_step80108/layer_24-model_01-model_states.pt b/4b284b84bc4seed1/global_step80108/layer_24-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..56411d3f918b3514d8578031bf3d18cf1dcded13 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/layer_24-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c3e1b65d8cd7651157798a652c093feb14c00d99b4376a40b99be8a559e098a +size 113308931 diff --git a/4b284b84bc4seed1/global_step80108/layer_25-model_00-model_states.pt b/4b284b84bc4seed1/global_step80108/layer_25-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed29bb7e61d3436696f011f3fb16fb31b5a459b1 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/layer_25-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2d59d419681711d7ffdd9717306f9a7eda0d3b32bac42f04d2ab3ec1e771253 +size 113308931 diff --git a/4b284b84bc4seed1/global_step80108/layer_25-model_01-model_states.pt b/4b284b84bc4seed1/global_step80108/layer_25-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d8fac7320306ce387a262054003234618454885 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/layer_25-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d046a5dadfa7a21a676f641771fd6c97f2eabc8b31af47427d690d62510c703 +size 113308931 diff --git a/4b284b84bc4seed1/global_step80108/layer_26-model_00-model_states.pt b/4b284b84bc4seed1/global_step80108/layer_26-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..13844c0ff66cc979cfb16eb702af1925fef68d64 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/layer_26-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ad3bf530633ca68a1720816d6bc2e360e4af088f050f175d02168dcc984696d +size 113308931 diff --git a/4b284b84bc4seed1/global_step80108/layer_26-model_01-model_states.pt b/4b284b84bc4seed1/global_step80108/layer_26-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1daed94bbea79b39df616b3fc55e668fc82a5330 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/layer_26-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7890b0e8e99852920256b5a8c82f979478353a685f6100fcafaf97bf3ad469f +size 113308931 diff --git a/4b284b84bc4seed1/global_step80108/layer_27-model_00-model_states.pt b/4b284b84bc4seed1/global_step80108/layer_27-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0d91ebe8bd7332ff3718a37f30fde9fae474122 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/layer_27-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ca0b09803311d1ae02d254fbcb172d841a51e15d80cb060c7397f09daa8f4a0 +size 113308931 diff --git a/4b284b84bc4seed1/global_step80108/layer_27-model_01-model_states.pt b/4b284b84bc4seed1/global_step80108/layer_27-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0664c4946dbccb74bb8e533564f515e265d54e6e --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/layer_27-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30a84eeb6bcd1e7e7cf557eb787e4fa64e6652aa87b76a64631eced153c2697b +size 113308931 diff --git a/4b284b84bc4seed1/global_step80108/layer_28-model_00-model_states.pt b/4b284b84bc4seed1/global_step80108/layer_28-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..42eb30dc66ed1379ccfa139ff490f2d4c77a3574 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/layer_28-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d702d16f11693a99989ebc5628c7869d3b6971b6c542368c13fa42b3c414b5d +size 113308931 diff --git a/4b284b84bc4seed1/global_step80108/layer_28-model_01-model_states.pt b/4b284b84bc4seed1/global_step80108/layer_28-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c78a6dd7be3921d94f9a67bdc3e4be8597d89508 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/layer_28-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:611459c154490c6174ed8db8d7d4170c82738f39a79a5ccfe21412cacdaecdf2 +size 113308931 diff --git a/4b284b84bc4seed1/global_step80108/layer_29-model_00-model_states.pt b/4b284b84bc4seed1/global_step80108/layer_29-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a14aa1ab478f9d3df48fffbac771254d17b01dc5 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/layer_29-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04d9092b865f4010e34cbe2f043b700d6f54acdfc4d30dd7cb6bc93363b2fab9 +size 113308931 diff --git a/4b284b84bc4seed1/global_step80108/layer_29-model_01-model_states.pt b/4b284b84bc4seed1/global_step80108/layer_29-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..caf95cc5cb78589259a88fc4ecfc4feaaddd815c --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/layer_29-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:687673d3d7c02c5426654ba486da47bb3ea2847fb7c344804563fb37a98c1163 +size 113308931 diff --git a/4b284b84bc4seed1/global_step80108/layer_30-model_00-model_states.pt b/4b284b84bc4seed1/global_step80108/layer_30-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f1c56eb5f9c2259f6fbd03c4bdba8676f163ac1 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/layer_30-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a023320944f4c9c879384f0893729f80637ddf3dd837e35c2a66b996a5fbcc01 +size 113308931 diff --git a/4b284b84bc4seed1/global_step80108/layer_30-model_01-model_states.pt b/4b284b84bc4seed1/global_step80108/layer_30-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae1fbb041fc86703121ec414fbe2161e5906e041 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/layer_30-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:069bc8dc9b8e04fd76df4ab204bc175b7c38b9c73c5672be96f7ffd14e9e5960 +size 113308931 diff --git a/4b284b84bc4seed1/global_step80108/layer_31-model_00-model_states.pt b/4b284b84bc4seed1/global_step80108/layer_31-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..248dbdc27a0e54a9ca6d82d94205794452de2736 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/layer_31-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91dd0356b437f8b03d92b1cee724966bcbc93af7d4033991a9ac521d7c772597 +size 113308931 diff --git a/4b284b84bc4seed1/global_step80108/layer_31-model_01-model_states.pt b/4b284b84bc4seed1/global_step80108/layer_31-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b827c78696f9575f776617450e94b88b401d683 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/layer_31-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:513184890cef14198540307daed116b134bd18418ce2d29e4395a1657b7a84af +size 113308931 diff --git a/4b284b84bc4seed1/global_step80108/layer_32-model_00-model_states.pt b/4b284b84bc4seed1/global_step80108/layer_32-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..755e030161d388ba0066b6a1adda9a8bfa005556 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/layer_32-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da39c36e345a2a529b4bd86a57b9ea49ed18d86cff682f6a97c4f01db62a1fc2 +size 113308931 diff --git a/4b284b84bc4seed1/global_step80108/layer_32-model_01-model_states.pt b/4b284b84bc4seed1/global_step80108/layer_32-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7fee159dfe9b42ca6c68c01c7ed2b5d03ffeb48a --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/layer_32-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccb458394f13b6db2639e15150f9f3d7584f9411578d6bbd10e45ee0f0a02e13 +size 113308931 diff --git a/4b284b84bc4seed1/global_step80108/layer_33-model_00-model_states.pt b/4b284b84bc4seed1/global_step80108/layer_33-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fce2df9bd14dbe987e21150a773bb8da588a89ce --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/layer_33-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d85811d387af54aba9c227de4a15d8340386403cc83270e9ba4b426bb5f6761 +size 113308931 diff --git a/4b284b84bc4seed1/global_step80108/layer_33-model_01-model_states.pt b/4b284b84bc4seed1/global_step80108/layer_33-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4aabb09763b18c0484e982be5aa0a9d6c000de2e --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/layer_33-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35420870d6b74381515a0d334b4f20b36b1a280aaa01c651b1f84a91122c2aaa +size 113308931 diff --git a/4b284b84bc4seed1/global_step80108/layer_34-model_00-model_states.pt b/4b284b84bc4seed1/global_step80108/layer_34-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5cdd3a9d9f43115e92c396dcfab6e6bf07a6abe8 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/layer_34-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7551aac8710d08a9684b9d7eb5021caab23c8a475a2fc5672ef97bcd2a8fd4c6 +size 113308931 diff --git a/4b284b84bc4seed1/global_step80108/layer_34-model_01-model_states.pt b/4b284b84bc4seed1/global_step80108/layer_34-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bafbe4eb8621ebae9183e98cd37af5784e2f6aff --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/layer_34-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77ecbcdb1fad0fbd24000b63b854cddc6635e024f7da652ddb1cf112b21b8182 +size 113308931 diff --git a/4b284b84bc4seed1/global_step80108/layer_35-model_00-model_states.pt b/4b284b84bc4seed1/global_step80108/layer_35-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e81d6ca54dc7aaefcca0bf210cb22f5ece0df0ab --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/layer_35-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ab3f571ca7249e3077565c84a94533938d10f086d754a74da52cbea94825b20 +size 113308931 diff --git a/4b284b84bc4seed1/global_step80108/layer_35-model_01-model_states.pt b/4b284b84bc4seed1/global_step80108/layer_35-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a830e2562dde9bf32d6b6eb2f2a39aedeb15f39 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/layer_35-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84808b9c66e8b363918699f023ce2b2749a7f233c11dd90acc1c8a87229d15bb +size 113308931 diff --git a/4b284b84bc4seed1/global_step80108/layer_36-model_00-model_states.pt b/4b284b84bc4seed1/global_step80108/layer_36-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f22dd0c1069b9146d4e01dc7c5e03a005fa3e84f --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/layer_36-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e221cdfd16550cb2ff7c2d696c94f763eaf4b08e4f26825400e765497bfed4a +size 113308931 diff --git a/4b284b84bc4seed1/global_step80108/layer_36-model_01-model_states.pt b/4b284b84bc4seed1/global_step80108/layer_36-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c97caa2d6610bc670edce9b4afece803559cefae --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/layer_36-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07dbda54a07ce7e34e664a0d4ea0ec1f81f5ef905ee7420b8ff8e7680a5b8180 +size 113308931 diff --git a/4b284b84bc4seed1/global_step80108/layer_37-model_00-model_states.pt b/4b284b84bc4seed1/global_step80108/layer_37-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b0f2b7b6811cb6f0c21f9de1ef446b8e9c1f3515 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/layer_37-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:675ebbb4fee20f4d5af9674c79e0a71a4cdb90f25b6a71231597e0ffe102236c +size 113308931 diff --git a/4b284b84bc4seed1/global_step80108/layer_37-model_01-model_states.pt b/4b284b84bc4seed1/global_step80108/layer_37-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..25c3b2ff016a22e5660422a1d4a06968a19675fb --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/layer_37-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee676b1f0faeaa31504a711a6e0e5866fe86ff78c28e14af50209239ecbd6511 +size 113308931 diff --git a/4b284b84bc4seed1/global_step80108/layer_38-model_00-model_states.pt b/4b284b84bc4seed1/global_step80108/layer_38-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf1f7efdf13967f7ae81ec1a4c24720e76362586 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/layer_38-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44c3463eb81b1be9097b131d6fe274ab50d09a56554064565b0c51ba7a708a54 +size 113308931 diff --git a/4b284b84bc4seed1/global_step80108/layer_38-model_01-model_states.pt b/4b284b84bc4seed1/global_step80108/layer_38-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4240c60845ca4cbf3958e437d958734db3836551 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/layer_38-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba44b239a7242d7692e2b39e43593e3106da742d3fbba963a8de30a6f74c9bb4 +size 113308931 diff --git a/4b284b84bc4seed1/global_step80108/layer_40-model_00-model_states.pt b/4b284b84bc4seed1/global_step80108/layer_40-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7bb5436171f2dce73c82163416a95b41dc526841 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/layer_40-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d4feaa7eba171ba39207ec67decf8ad8ec9419a36225e2dbce4b841bc862b41 +size 13507 diff --git a/4b284b84bc4seed1/global_step80108/layer_40-model_01-model_states.pt b/4b284b84bc4seed1/global_step80108/layer_40-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd70fa0bb2191f33fc56123f181339f4205510fd --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/layer_40-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:110f57915eaaa2470ac00d40a00a857b1de1d6ecd6091900afc59a0d80115619 +size 13507 diff --git a/4b284b84bc4seed1/global_step80108/mp_rank_00_model_states.pt b/4b284b84bc4seed1/global_step80108/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f0249397c2df491591d57f77c2e7feaaa402808f --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a908cf5bbc396f43f32cbe3bb188e857057b6c9e825ae2f8be595b28117adb6 +size 51443 diff --git a/4b284b84bc4seed1/global_step80108/mp_rank_01_model_states.pt b/4b284b84bc4seed1/global_step80108/mp_rank_01_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c21b98f846305f5eefa12bfa89d8e5dac26b278 --- /dev/null +++ b/4b284b84bc4seed1/global_step80108/mp_rank_01_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f849f2d61a8620c8516afdbc0505dd116b2d47683dabcc7cfdbf40cb00a5dee +size 51443 diff --git a/4b284b84bc4seed1/transformers/config.json b/4b284b84bc4seed1/transformers/config.json new file mode 100644 index 0000000000000000000000000000000000000000..df814c3a71ee49044410636b5eeb4f43611690ba --- /dev/null +++ b/4b284b84bc4seed1/transformers/config.json @@ -0,0 +1 @@ +{"vocab_size": 50432, "n_positions": 2048, "n_embd": 3072, "n_layer": 36, "n_head": 24, "n_inner": 12288, "activation_function": "gelu", "resid_pdrop": 0.1, "embd_pdrop": 0.1, "attn_pdrop": 0.1, "layer_norm_epsilon": 1e-05, "initializer_range": 0.02, "summary_type": "cls_index", "summary_use_proj": true, "summary_activation": null, "summary_first_dropout": 0.1, "summary_proj_to_labels": true, "scale_attn_weights": true, "use_cache": true, "scale_attn_by_inverse_layer_idx": false, "reorder_and_upcast_attn": false, "bos_token_id": 50256, "eos_token_id": 50256, "return_dict": true, "output_hidden_states": false, "output_attentions": false, "torchscript": false, "torch_dtype": null, "use_bfloat16": false, "tf_legacy_loss": false, "pruned_heads": {}, "tie_word_embeddings": true, "is_encoder_decoder": false, "is_decoder": false, "cross_attention_hidden_size": null, "add_cross_attention": false, "tie_encoder_decoder": false, "max_length": 20, "min_length": 0, "do_sample": false, "early_stopping": false, "num_beams": 1, "num_beam_groups": 1, "diversity_penalty": 0.0, "temperature": 1.0, "top_k": 50, "top_p": 1.0, "typical_p": 1.0, "repetition_penalty": 1.0, "length_penalty": 1.0, "no_repeat_ngram_size": 0, "encoder_no_repeat_ngram_size": 0, "bad_words_ids": null, "num_return_sequences": 1, "chunk_size_feed_forward": 0, "output_scores": false, "return_dict_in_generate": false, "forced_bos_token_id": null, "forced_eos_token_id": null, "remove_invalid_values": false, "exponential_decay_length_penalty": null, "suppress_tokens": null, "begin_suppress_tokens": null, "architectures": ["GPT2LMHeadModel"], "finetuning_task": null, "id2label": {"0": "LABEL_0", "1": "LABEL_1"}, "label2id": {"LABEL_0": 0, "LABEL_1": 1}, "tokenizer_class": null, "prefix": null, "pad_token_id": null, "sep_token_id": null, "decoder_start_token_id": null, "task_specific_params": null, "problem_type": null, "_name_or_path": "", "transformers_version": "4.25.0.dev0", "n_ctx": 1024, "gradient_checkpointing": false, "model_type": "gpt2"} \ No newline at end of file diff --git a/4b284b84bc4seed1/transformers/pytorch_model.bin b/4b284b84bc4seed1/transformers/pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..f7b4640d2752ef63663c40e5961ed3b346ff9bd9 --- /dev/null +++ b/4b284b84bc4seed1/transformers/pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37331c46b52316508d0defe0faff58fda813b2b0199b0b758f8385221296e6c2 +size 8781203669 diff --git a/4b284b84bc4seed2/evaluation/generation/agg.4b284b84bc4seed2_GEM-web_nlg_en_PALM_prompt_0.json b/4b284b84bc4seed2/evaluation/generation/agg.4b284b84bc4seed2_GEM-web_nlg_en_PALM_prompt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..351efd1281ac776845f54be4a38c2c270284dc2c --- /dev/null +++ b/4b284b84bc4seed2/evaluation/generation/agg.4b284b84bc4seed2_GEM-web_nlg_en_PALM_prompt_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.3463387125507984, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.03871898741816671}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07211255715607569, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.001551406165163628}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.2996849092736172, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004583023786340968}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.10952539068797028, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0019907747077539725}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03381420888180137, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0008950985117036589}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.14844147775806338, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0032200950902031658}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.05201678241725894, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0012570598168046025}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.06953968025004763, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0014395600092792235}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.2927861422575508, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004486869628532065}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.10599044553263734, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001858626781810144}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.06905492701097961, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0014675622764115906}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.28799521128404415, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004338230779660113}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.10494341774143819, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0018712967363079748}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed2/evaluation/generation/agg.4b284b84bc4seed2_GEM-web_nlg_en_PALM_prompt_1.json b/4b284b84bc4seed2/evaluation/generation/agg.4b284b84bc4seed2_GEM-web_nlg_en_PALM_prompt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..ec02169f2516d55b601dd4a83710a609afdbd6ce --- /dev/null +++ b/4b284b84bc4seed2/evaluation/generation/agg.4b284b84bc4seed2_GEM-web_nlg_en_PALM_prompt_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.49152208622242877, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.04139408950745415}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07373625415642708, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0013444564112333292}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.3753665468025263, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.00536016010380475}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.11542248804126877, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.001852315570556662}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03437112478262944, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0008158271460114628}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.1839462343866126, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003709671721946962}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.05396039097370975, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0011621890988087783}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.06891381858838289, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.00117848640155061}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.3513896637107432, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004856217872136033}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.1080526825836882, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0016391879678756425}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.07022268782208652, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0012677785220343175}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.3548574219712635, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004914558194954389}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.10983109806282532, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0017465824716290605}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed2/evaluation/generation/agg.4b284b84bc4seed2_GEM-web_nlg_en_PALM_prompt_2.json b/4b284b84bc4seed2/evaluation/generation/agg.4b284b84bc4seed2_GEM-web_nlg_en_PALM_prompt_2.json new file mode 100644 index 0000000000000000000000000000000000000000..2b98a731a60759d458df3be3288bb0873cd7c1bb --- /dev/null +++ b/4b284b84bc4seed2/evaluation/generation/agg.4b284b84bc4seed2_GEM-web_nlg_en_PALM_prompt_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.5036165898830023, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.03163382931247645}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07345117313274237, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0012208182117261878}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.3941081050839388, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005139991780948632}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.11611735091169018, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0016856649398913782}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03416030472845622, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007497324529078045}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.1960695205229479, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.00374456566803786}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.0542677230188957, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001076889081745943}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.06848596200566257, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001088456262302762}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.3641445841455221, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004555374452263096}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.10822818662084129, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0015080010309372358}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.06991710191369618, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.00115124520295404}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.37308280267746685, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004752608689239747}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.11045227449849929, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0015880076943480838}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed2/evaluation/generation/agg.4b284b84bc4seed2_GEM-web_nlg_en_PALM_prompt_3.json b/4b284b84bc4seed2/evaluation/generation/agg.4b284b84bc4seed2_GEM-web_nlg_en_PALM_prompt_3.json new file mode 100644 index 0000000000000000000000000000000000000000..118fe1bd40d69ca52ee48bdbc5a6f582a89157f5 --- /dev/null +++ b/4b284b84bc4seed2/evaluation/generation/agg.4b284b84bc4seed2_GEM-web_nlg_en_PALM_prompt_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.6498113531541159, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.044359939496823625}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07362728433969368, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0012506969519923664}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.40433747874257164, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.00532349382454595}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.11670639827568505, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0017228506693859023}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03462285279213432, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007700688556812641}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.20446580518938245, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0038704073812126957}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.055174784608656414, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001103480731304987}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.06807883372554288, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0011054577780329877}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.369498755496309, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004606643368535042}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.10780699471813608, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0015196469475095016}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.06987690204692998, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.001181829372472824}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.38020527679899335, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004841997364585111}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.11062957727513113, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016229376323127634}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed2/evaluation/generation/agg.4b284b84bc4seed2_GEM-web_nlg_en_PALM_prompt_4.json b/4b284b84bc4seed2/evaluation/generation/agg.4b284b84bc4seed2_GEM-web_nlg_en_PALM_prompt_4.json new file mode 100644 index 0000000000000000000000000000000000000000..c262a8aa9b9999cedb36abef6ece9c038567c460 --- /dev/null +++ b/4b284b84bc4seed2/evaluation/generation/agg.4b284b84bc4seed2_GEM-web_nlg_en_PALM_prompt_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.6676812083161542, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.04984003951128037}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07419859091894718, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0012073720133260548}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.4115156265704582, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005279248235847037}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.11795519287394977, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.001663656872341927}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03509931891578484, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007461921191218064}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.21194614881093146, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003942396709196514}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.05617955897318711, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001072962808033341}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.0683956812460672, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0010554662078452836}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.37604842524473375, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004602132355576208}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.10867138834194551, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0014576101979114201}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.07053184039179991, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0011422521869853676}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.3893450058485989, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004865697961495776}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.11206081323499055, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.001572212563142291}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed2/evaluation/generation/agg.4b284b84bc4seed2_GEM-web_nlg_en_PALM_prompt_5.json b/4b284b84bc4seed2/evaluation/generation/agg.4b284b84bc4seed2_GEM-web_nlg_en_PALM_prompt_5.json new file mode 100644 index 0000000000000000000000000000000000000000..117826142bcb9fb301aaae2d6b158ab04a31280c --- /dev/null +++ b/4b284b84bc4seed2/evaluation/generation/agg.4b284b84bc4seed2_GEM-web_nlg_en_PALM_prompt_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.7710974467285127, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.05203704839844347}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07425806182657936, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0011956495019689597}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.42780274108203253, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005406944243614746}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.11877703066041605, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0016491364267747024}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03492035728514057, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.000728989115137721}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.22003827942872525, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.004025013823319427}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.05625150089671772, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0010511709925049085}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.06747232289163295, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001034208622107367}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.3846963659749557, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004603801517001138}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.10772149028740496, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0014157977593889726}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.07017346453232838, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.001136713184580948}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.40087756811378206, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004939981502609751}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.11204458204469926, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0015584717483504628}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed2/evaluation/generation/agg.4b284b84bc4seed2_GEM-wiki_lingua_en_tldr_en_0.json b/4b284b84bc4seed2/evaluation/generation/agg.4b284b84bc4seed2_GEM-wiki_lingua_en_tldr_en_0.json new file mode 100644 index 0000000000000000000000000000000000000000..e6ce3d5170e58783e567630001720d356653aa80 --- /dev/null +++ b/4b284b84bc4seed2/evaluation/generation/agg.4b284b84bc4seed2_GEM-wiki_lingua_en_tldr_en_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.15426863660325024, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0019390767016899475}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.26616584906943935, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002800247123213755}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.18179483366438334, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.001918528213130623}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.032398604164030766, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007853568426710733}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.059178979799423694, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0015378959605561995}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.03857873002486118, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0008912625012118423}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.1178409029648999, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.00134426120796486}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.21156320512029583, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002302858626762558}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.14062571654868716, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0013664451991987955}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.14121341341165533, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0017607776877685353}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.24535304568196398, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0026196185425979572}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.1667428911480839, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0017491099585958065}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 1.7317879218324492, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.06258434310865753}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed2/evaluation/generation/agg.4b284b84bc4seed2_GEM-wiki_lingua_en_tldr_en_1.json b/4b284b84bc4seed2/evaluation/generation/agg.4b284b84bc4seed2_GEM-wiki_lingua_en_tldr_en_1.json new file mode 100644 index 0000000000000000000000000000000000000000..e458f65eebcce505377479610cd534b079fe3adb --- /dev/null +++ b/4b284b84bc4seed2/evaluation/generation/agg.4b284b84bc4seed2_GEM-wiki_lingua_en_tldr_en_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.2097374056236598, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002558792591642619}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.31993230192333455, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002912578847069188}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.22615743170046998, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0019675759971617946}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.05460829335196789, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0013104520035504465}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.08436597375871419, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0018136264810112849}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.05788753426578909, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0011036642735696503}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.14966153212559197, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0019100435840523184}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.23314632888007986, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002308314606066584}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.16096845678834487, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0013344427734486718}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.1969300454898004, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.002419281823679596}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.3015516742807266, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0027852344656345953}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.21248946284679468, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.001850444919705845}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 3.078946318578733, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.037508376634953426}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed2/evaluation/generation/agg.4b284b84bc4seed2_GEM-wiki_lingua_en_tldr_en_2.json b/4b284b84bc4seed2/evaluation/generation/agg.4b284b84bc4seed2_GEM-wiki_lingua_en_tldr_en_2.json new file mode 100644 index 0000000000000000000000000000000000000000..f43a0d3b86587536b92027431c2b7206fbc91c97 --- /dev/null +++ b/4b284b84bc4seed2/evaluation/generation/agg.4b284b84bc4seed2_GEM-wiki_lingua_en_tldr_en_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.2249179940170448, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002953091033379103}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.30791265980488064, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0028052680018540153}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.22500809081344597, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0019395777660833832}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.06082816124882105, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0015517487698999066}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.08191649217784704, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0017207233219242591}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.058940718015282535, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0011427794692985003}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.1651950475417842, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0023849745375518774}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.22637843422800283, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002257218203318618}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.1629946491305722, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001412842903446524}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.21271781118896244, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0027972927699949795}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.29203959550294045, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002679740707668158}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.21287275166909125, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.001828524451639913}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 3.331365912474371, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.03901431585240638}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed2/evaluation/generation/agg.4b284b84bc4seed2_GEM-wiki_lingua_en_tldr_en_3.json b/4b284b84bc4seed2/evaluation/generation/agg.4b284b84bc4seed2_GEM-wiki_lingua_en_tldr_en_3.json new file mode 100644 index 0000000000000000000000000000000000000000..102c2c4ef19637a6ae84f09726ab5f63ca4996dc --- /dev/null +++ b/4b284b84bc4seed2/evaluation/generation/agg.4b284b84bc4seed2_GEM-wiki_lingua_en_tldr_en_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.1984883398198494, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.003387900153458854}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.2444675402553931, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.003332060879697036}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.1828984280612045, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.00233789023320496}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.05494653639366956, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.00172026049377679}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.06573981524186268, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.001646361012922936}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.048423081518600516, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0011278965656492843}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.14973545109772782, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002771115067407858}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.1820828761022503, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002594908370622835}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.13482403873394622, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0017315326993232382}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.1876688685476534, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003222108012150837}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.23146444735253652, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.003170383006624478}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.1727178547993039, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0022030460306759693}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 3.4654459013677066, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.09533106520935124}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed2/evaluation/generation/agg.4b284b84bc4seed2_GEM-wiki_lingua_en_tldr_en_4.json b/4b284b84bc4seed2/evaluation/generation/agg.4b284b84bc4seed2_GEM-wiki_lingua_en_tldr_en_4.json new file mode 100644 index 0000000000000000000000000000000000000000..e2fa3ed98e3c7c5b4c78b12bbbb651c53720ce31 --- /dev/null +++ b/4b284b84bc4seed2/evaluation/generation/agg.4b284b84bc4seed2_GEM-wiki_lingua_en_tldr_en_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.06373323883393266, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0025948109156841556}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.07974114305386926, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002852169393376925}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.057249298351433005, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.001981710879314234}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.017183606562936146, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.001165303674699654}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.021451383479229473, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.00115814797861179}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.014679683423748945, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0007250006064285315}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.049676263167134256, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0021317796688731104}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.061127221909033094, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0022295833532602533}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.04339902158323832, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0014931210623861644}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.059918160107108445, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.002458251392796141}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.07475299437390277, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0026852062028548873}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.05356492994210666, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0018539473478258858}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 0.5096514625512257, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.04746911438860582}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed2/evaluation/generation/agg.4b284b84bc4seed2_GEM-wiki_lingua_en_tldr_en_5.json b/4b284b84bc4seed2/evaluation/generation/agg.4b284b84bc4seed2_GEM-wiki_lingua_en_tldr_en_5.json new file mode 100644 index 0000000000000000000000000000000000000000..a920195035388983f99247ae8300c14c73e8c83d --- /dev/null +++ b/4b284b84bc4seed2/evaluation/generation/agg.4b284b84bc4seed2_GEM-wiki_lingua_en_tldr_en_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.00974635222327858, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0010426157804008867}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.013305767376845547, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.001294486365694067}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.009381663500620675, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0009033228148794374}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.0027541706176161013, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0004991531053543725}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.0034881657779112446, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0004828260114230198}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.002426218955168773, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.00032099513562133}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.007558937884226414, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0008514792129217634}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.010297022985567691, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0010209752122782392}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.007132684824681642, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0006849988631397933}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.00925164902439946, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.001003429166331945}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.012522528933544396, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0012265948088620682}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.008824412648201954, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0008523533756253951}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 2.4367817796838913e-07, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 5.931740679366216e-07}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed2/evaluation/generation/agg.4b284b84bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_0.json b/4b284b84bc4seed2/evaluation/generation/agg.4b284b84bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..76ad0d64f73ba38749ee67e6a40a9d55c2d9afe7 --- /dev/null +++ b/4b284b84bc4seed2/evaluation/generation/agg.4b284b84bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 1.4674593008700727, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.07690373053792376}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.05683753991737235, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0014560506575201325}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.08937391024861521, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002366915901253559}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.06377803506212068, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.001672122677396593}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.012214590726895359, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0005743247716736654}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.021379218732414145, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0009966104546792834}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.015238638354519577, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0007071169872858592}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.05347894988195794, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0013049823564136975}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.08437384990508254, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0021538312776559535}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.059880641876164487, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0014895688210922907}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.05199652967109443, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.001336335232731129}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.08011650518165435, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0021036901960562}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.057561121270217515, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0014995174600948955}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed2/evaluation/generation/agg.4b284b84bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_1.json b/4b284b84bc4seed2/evaluation/generation/agg.4b284b84bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_1.json new file mode 100644 index 0000000000000000000000000000000000000000..91bc7ba27016ca501ac329f03d88f0f5e4cacce8 --- /dev/null +++ b/4b284b84bc4seed2/evaluation/generation/agg.4b284b84bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 11.256639255609565, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.13909119146023038}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.5241369762469382, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0032402613188758484}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4154073794853628, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0029811452241909936}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.43826153885312474, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0023680361634807615}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.24440729108549972, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0025713353876726987}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.1903569141394937, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002085369890907639}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.20120573159323082, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0019466830589320579}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.3797441094381383, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002849422577384458}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.2977661478395331, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0023832352149522175}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.31512942959617346, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0020245073951865498}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.4269573872984081, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003094947485413177}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.33674441043750625, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.00269773822444997}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.35586936216582027, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002288936359442796}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed2/evaluation/generation/agg.4b284b84bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_2.json b/4b284b84bc4seed2/evaluation/generation/agg.4b284b84bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_2.json new file mode 100644 index 0000000000000000000000000000000000000000..5b138307cd085597a079da82808aed295a7a4f8a --- /dev/null +++ b/4b284b84bc4seed2/evaluation/generation/agg.4b284b84bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 13.376126264980714, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.2423138700015996}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.5586896631262273, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0032542273894082263}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4534492320208494, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0029116157123098745}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.47582339525157197, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0022765247887398116}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.27694841097623996, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.002758389324353955}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.2206909261465891, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0021891415728379693}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.23204546503817813, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.002046713809774589}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.40753042690914904, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002988569615037221}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3271426648953936, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002412434421850288}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.34446258237680916, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0020760578430186376}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.4602485572678633, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003204122515744201}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3712619134780482, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0026876195742092054}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.39054726501758946, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002301771792227363}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed2/evaluation/generation/agg.4b284b84bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_3.json b/4b284b84bc4seed2/evaluation/generation/agg.4b284b84bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_3.json new file mode 100644 index 0000000000000000000000000000000000000000..ed71489385825bc824f4b46623b64503754fb391 --- /dev/null +++ b/4b284b84bc4seed2/evaluation/generation/agg.4b284b84bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 14.093165522897872, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.21216386354546166}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.5387233761250629, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0031864759527455624}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4726895100996329, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002899854544961585}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.4785676515677228, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0022234504082830633}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.2685393636176561, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0026170967343239477}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.23277587897646693, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0022527763377626336}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.23558342825678338, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.002030621156209231}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.39161805848668024, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002876699759638117}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.34175514874890695, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0024862399492205957}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.34641516486003826, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0020831944107613303}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.44704833712523245, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003092169155791799}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3913487563855888, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0027430209943532587}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.3965640250353348, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0022751928578861502}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed2/evaluation/generation/agg.4b284b84bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_4.json b/4b284b84bc4seed2/evaluation/generation/agg.4b284b84bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_4.json new file mode 100644 index 0000000000000000000000000000000000000000..deeb27730e276f002dee901948b15d4cfe552b48 --- /dev/null +++ b/4b284b84bc4seed2/evaluation/generation/agg.4b284b84bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 13.01877522701202, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.1634606411416184}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.4967367435501768, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002997180519517344}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.48986433299719573, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0028919527625229664}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.47017887879088466, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.00215775715520141}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.24350630882815852, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.002422719426969184}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.2387594057692899, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0022672859667634986}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.2285190900484798, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001968236514909628}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.3508199102140834, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002597964369996749}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.34517696947416515, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0024767421656897485}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.3311043111563345, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001975651372330419}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.4096834114721446, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0028584575443569072}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.4045460483730194, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002787010565242438}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.3879654204025311, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.00222102600090257}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed2/evaluation/generation/agg.4b284b84bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_5.json b/4b284b84bc4seed2/evaluation/generation/agg.4b284b84bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_5.json new file mode 100644 index 0000000000000000000000000000000000000000..e6a0052d5cabf6e4bfba98a715075888ee9ab825 --- /dev/null +++ b/4b284b84bc4seed2/evaluation/generation/agg.4b284b84bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 11.738533814250154, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.20692029359403782}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.4557324007548413, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0026141133736043063}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.5008190200746241, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0027912701451645113}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.4579176439966838, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0019838649103218315}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.21649241809836905, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0020808047468387015}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.23946332773224333, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0022622492821207474}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.21699681614941907, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0018260134934355917}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.31896738977233224, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002249879972490852}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3516931047967278, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0024669281840779384}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.3204737144833669, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0018416039122686005}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.3790705627204969, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0024962460456464603}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.4171792042608784, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0027157128707540365}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.38110492282903374, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0020518013347156708}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed2/evaluation/generation/agg.4b284b84bc4seed2_gem_xsum_article_DOC_summary_0.json b/4b284b84bc4seed2/evaluation/generation/agg.4b284b84bc4seed2_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..06541110dfea51c5c88970b8f85b75c5c85825dc --- /dev/null +++ b/4b284b84bc4seed2/evaluation/generation/agg.4b284b84bc4seed2_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.17320559498489507, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0025525024097035748}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.33568511811329627, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004457272030335943}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.2173222672616331, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0026735963951633086}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.03984347722138949, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0014498730660041778}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.08293611853648174, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0027922604769135967}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.05119317937818865, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0016915277669349944}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.1306308027797899, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001979750535716133}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.25481924486600754, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0034477504419509046}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.16413944160730887, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0020492207241516436}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.13618964667417757, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0020883754136888665}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.2671983620973551, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0038518682770408703}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.17170031392993537, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002265881556419863}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 2.2151365071026334, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.10551243625041298}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed2/evaluation/generation/agg.4b284b84bc4seed2_gem_xsum_article_DOC_summary_1.json b/4b284b84bc4seed2/evaluation/generation/agg.4b284b84bc4seed2_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..65ccc1e07de2bd9a3fcfeb18dda697017b7c239d --- /dev/null +++ b/4b284b84bc4seed2/evaluation/generation/agg.4b284b84bc4seed2_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.13193321373947423, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0018249214408045705}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.32491663088067385, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004280533648795701}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.18543200867192464, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0024553301715842025}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.02885078338766851, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0010494871344340587}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.07423283049608298, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0027810291758957346}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.04099230088578755, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0014846354986486204}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.10387006177524372, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0013802990359211345}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.2578619666146113, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.003428735324171146}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.14626844109613504, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0018773361178004498}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.10445447840702451, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.001509990224349501}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.2598290086664842, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0037495698358454184}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.1472004999527075, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0020688083081768726}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.5874448429909755, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.07657449929611179}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed2/evaluation/generation/agg.4b284b84bc4seed2_gem_xsum_article_DOC_summary_2.json b/4b284b84bc4seed2/evaluation/generation/agg.4b284b84bc4seed2_gem_xsum_article_DOC_summary_2.json new file mode 100644 index 0000000000000000000000000000000000000000..d024f6f9f406f3159f606b882c5fffe871cc4fac --- /dev/null +++ b/4b284b84bc4seed2/evaluation/generation/agg.4b284b84bc4seed2_gem_xsum_article_DOC_summary_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.13378369552141486, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.001828879330748606}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.32737811206091777, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004306408194620798}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.18753394533546663, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0024632687591213827}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.0299925935097244, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0010381433997656876}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.07593086345843493, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0027442526221015794}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.04246731521010523, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0014710047875479853}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.10643964494355733, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0013938532111114862}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.26198866539949395, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0034185812335638674}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.14937612301640457, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0018862901936057773}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.10465900735165316, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0014985247658685268}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.25870432987334707, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0037543234582558148}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.14706588908674015, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0020537944843788485}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.620400084032387, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.1036187597036037}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed2/evaluation/generation/agg.4b284b84bc4seed2_gem_xsum_article_DOC_summary_3.json b/4b284b84bc4seed2/evaluation/generation/agg.4b284b84bc4seed2_gem_xsum_article_DOC_summary_3.json new file mode 100644 index 0000000000000000000000000000000000000000..024174476ba87ae6860088105bad61994071e22e --- /dev/null +++ b/4b284b84bc4seed2/evaluation/generation/agg.4b284b84bc4seed2_gem_xsum_article_DOC_summary_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.1325857147512653, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002104582538451698}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.310270163693354, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004622235270535744}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.181742673631377, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0026996346996907114}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.030071518934551324, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0010760225740262315}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.07399993568063115, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0027512935104685335}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.041996639319967895, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0014924431333982891}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.10572519383258887, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001594887821630211}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.24999311515441475, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0037295235353239403}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.1455139114170652, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.002103135242813012}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.10501603221104056, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0017119294258030526}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.24836824871710267, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.003968401031348439}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.1443734491656482, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002242271836640455}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.6556986327135799, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.09408085446538644}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed2/evaluation/generation/agg.4b284b84bc4seed2_gem_xsum_article_DOC_summary_4.json b/4b284b84bc4seed2/evaluation/generation/agg.4b284b84bc4seed2_gem_xsum_article_DOC_summary_4.json new file mode 100644 index 0000000000000000000000000000000000000000..22213b72bf286abb8328a02f13bd03929a19de98 --- /dev/null +++ b/4b284b84bc4seed2/evaluation/generation/agg.4b284b84bc4seed2_gem_xsum_article_DOC_summary_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.04185793101612411, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0025354871639657332}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.07960189442566881, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004594099676529609}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.051203664083526064, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002916215578123627}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.009545271254314988, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0009027168872299666}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.019489192736000506, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0016525733661952122}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.012145091480254444, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001038605071999789}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.03331696824804232, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002048247078605598}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.06320111546579645, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0036120398264049094}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.040479741202891835, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0022777830898179745}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.033884182850020796, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0021113829994884406}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.0637408678817515, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.003715585442877857}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.041001723419299384, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0023481586557545764}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 0.8787323538547989, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.09806037997681721}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed2/evaluation/generation/agg.4b284b84bc4seed2_gem_xsum_article_DOC_summary_5.json b/4b284b84bc4seed2/evaluation/generation/agg.4b284b84bc4seed2_gem_xsum_article_DOC_summary_5.json new file mode 100644 index 0000000000000000000000000000000000000000..a12592eb29e890ec317bfd18344b2ce7b389816b --- /dev/null +++ b/4b284b84bc4seed2/evaluation/generation/agg.4b284b84bc4seed2_gem_xsum_article_DOC_summary_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.003661405957465891, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0010410174134967514}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.003073378808572809, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0008998604189966408}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.003279934928320664, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0009428534366320934}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.0007725002522449804, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0003775496435431225}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.0007322912012146197, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0003972475356359937}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.0007405035248494208, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.00038311030521319677}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.002439909640242604, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0006917842321148266}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.0020657262287064482, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.000601437175466453}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.0021896510504014074, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0006251341441438973}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.0030026261505173824, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0008643214712623419}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.002523952641616138, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0007458033281437961}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.0026863003460885, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0007784026207598828}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 6.480764426251045e-36, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 1.6529080147588964e-30}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_GEM-web_nlg_en_PALM_prompt_0.jsonl b/4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_GEM-web_nlg_en_PALM_prompt_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..57baf9d28e86eeeff551e96851f98491e494344f --- /dev/null +++ b/4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_GEM-web_nlg_en_PALM_prompt_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75957884600dab9be9bc155e2e1081e92e445dde23967ee12389a412dac3ce75 +size 4137129 diff --git a/4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_GEM-web_nlg_en_PALM_prompt_1.jsonl b/4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_GEM-web_nlg_en_PALM_prompt_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..5e8d4e363051ce9a439d3784796c9bca0cb51c09 --- /dev/null +++ b/4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_GEM-web_nlg_en_PALM_prompt_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0bfbf192fe7e518e764bd456d3e9047f8433b9033574cd2be59588daa5d5937 +size 5145276 diff --git a/4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_GEM-web_nlg_en_PALM_prompt_2.jsonl b/4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_GEM-web_nlg_en_PALM_prompt_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..3e88887a1fbaaf376c87390c04c81b76c70c0b9a --- /dev/null +++ b/4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_GEM-web_nlg_en_PALM_prompt_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfd5666d3c4fa4fe6dda491c97dfc0e55c7f2c6dbb28bc76545ea432cfc776e1 +size 6056056 diff --git a/4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_GEM-web_nlg_en_PALM_prompt_3.jsonl b/4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_GEM-web_nlg_en_PALM_prompt_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e863327ce917de3e14cac7f84b33891d950883b3 --- /dev/null +++ b/4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_GEM-web_nlg_en_PALM_prompt_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ed7759819b4cf9c106c5ed638741ab1ac91c7e286a9d7f956ab8cc6e046eac7 +size 6983686 diff --git a/4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_GEM-web_nlg_en_PALM_prompt_4.jsonl b/4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_GEM-web_nlg_en_PALM_prompt_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..1c924330a08d96841bb6d0fd968e77e279275aca --- /dev/null +++ b/4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_GEM-web_nlg_en_PALM_prompt_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8012220cce244292caab760c396053aed9a3fcf322b0a93d64eb05bc2ef6f92 +size 7882083 diff --git a/4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_GEM-web_nlg_en_PALM_prompt_5.jsonl b/4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_GEM-web_nlg_en_PALM_prompt_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..78e2bb7558d780cbee242141a5f623fe4f2ef3a4 --- /dev/null +++ b/4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_GEM-web_nlg_en_PALM_prompt_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1c5adb26a66de3c29559c893c0dcf9a9203c92675da2f03887371e14a2ff259 +size 8814514 diff --git a/4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_GEM-wiki_lingua_en_tldr_en_0.jsonl b/4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_GEM-wiki_lingua_en_tldr_en_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..dc859b16cff644a3932f861ded804d5fb9565417 --- /dev/null +++ b/4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_GEM-wiki_lingua_en_tldr_en_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af66dd60ef7af298de8d631ee5d6dd536aba72e7e7078ff2931af0f9c3b9cd7c +size 7692763 diff --git a/4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_GEM-wiki_lingua_en_tldr_en_1.jsonl b/4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_GEM-wiki_lingua_en_tldr_en_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..aadadc62ecf88c1fc64548ab20f416f4d60b5301 --- /dev/null +++ b/4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_GEM-wiki_lingua_en_tldr_en_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:537f069fde36846318df23d90d8c555c2f180d3ae8e5d0d10df178ba5f7be4d4 +size 13291456 diff --git a/4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_GEM-wiki_lingua_en_tldr_en_2.jsonl b/4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_GEM-wiki_lingua_en_tldr_en_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..d3ecd592e267023f5b910240e9fe6b2c5bd7b9e3 --- /dev/null +++ b/4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_GEM-wiki_lingua_en_tldr_en_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b401a8175e7c448b34cf80faf21321cba1fe0528aa8799c2be4afe95fd447f8a +size 18860517 diff --git a/4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_GEM-wiki_lingua_en_tldr_en_3.jsonl b/4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_GEM-wiki_lingua_en_tldr_en_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..c30c446d99b44625f950351caa2ada78f7d6c5d6 --- /dev/null +++ b/4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_GEM-wiki_lingua_en_tldr_en_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4f15a4beb06bc5bfa9589cea87b8f40bdbe004f1adfc45e06ac1cfc50001c40 +size 24255090 diff --git a/4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_GEM-wiki_lingua_en_tldr_en_4.jsonl b/4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_GEM-wiki_lingua_en_tldr_en_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..ee8c4dbf6492e311e7953e2170bd31fd7feaa47d --- /dev/null +++ b/4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_GEM-wiki_lingua_en_tldr_en_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a60fc718772b8b940b3d6f5c21c7ad5f12f5225b460526b5f67edbde4c07b63 +size 29444986 diff --git a/4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_GEM-wiki_lingua_en_tldr_en_5.jsonl b/4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_GEM-wiki_lingua_en_tldr_en_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..0373e42fe2fd27c14ace9dd01cf1fdcfdc25781d --- /dev/null +++ b/4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_GEM-wiki_lingua_en_tldr_en_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6446e6e3d693d1afa345eef60f7c4e6ab5aeecc789a36050ab7ca46c85d40358 +size 34796088 diff --git a/4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl b/4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..ccc35810ab3fde48251ca1644ebfcdf080fb41c8 --- /dev/null +++ b/4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca4c3943a3b62ae86db4c90919d4d3a31d2338727b5e135365d6dfa8f1ae103b +size 4405383 diff --git a/4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl b/4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..6f1ec5f01a3b8449cb2232e7a5cf0c91ad826437 --- /dev/null +++ b/4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7e54b0f016ed5a015764d9e9e101b2db2ac229088411bc493f41d05d17293bd +size 5027922 diff --git a/4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl b/4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..fa0ca0b4e832a4bdb8ee3a56c45ec883caa7d530 --- /dev/null +++ b/4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb9aa3005158c1ad1b4b811cb2887f6ba1854d6aab4d733a356b62e12995dcbe +size 6122719 diff --git a/4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl b/4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..c72612293854f7d45984e6cb82cf091c6c2ed691 --- /dev/null +++ b/4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1cdc64e365e74930c83ba4138f6776e590980530d52b27840e4c9664b2bcef0 +size 7238288 diff --git a/4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl b/4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..0952960fc66b2d4b3ea7701b7c12ff0f0a1457e4 --- /dev/null +++ b/4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be8e8e62050e73236f7a9fa4aaa78bf83afb8755d5c8806c8d546471c67d4e82 +size 8368065 diff --git a/4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl b/4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..1b62545a4af56c934cfa82902f5ae373b5bdad57 --- /dev/null +++ b/4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c197ac383c4f48da6424a30c0db33871b43c387e86693ef6067e6ec3eb59eb4d +size 9501406 diff --git a/4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_gem_xsum_article_DOC_summary_0.jsonl b/4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_gem_xsum_article_DOC_summary_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..c6ac94b8d00ead473751430584c904bfc45df905 --- /dev/null +++ b/4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_gem_xsum_article_DOC_summary_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:671c4c4576e1d191ee88f37a4fdb15207f2c54382632b3092b788edcf0259129 +size 2784524 diff --git a/4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_gem_xsum_article_DOC_summary_1.jsonl b/4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_gem_xsum_article_DOC_summary_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..0aa781859ee09363964902c7db57d4e0b9864b4b --- /dev/null +++ b/4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_gem_xsum_article_DOC_summary_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:369db13d665cd21ec44da0d27db6bc5890b0ab3107351e21d6fffa545e632c18 +size 5101838 diff --git a/4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_gem_xsum_article_DOC_summary_2.jsonl b/4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_gem_xsum_article_DOC_summary_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..d7408600fdcd9d3aa90fcdc9e9c52f403528e3d3 --- /dev/null +++ b/4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_gem_xsum_article_DOC_summary_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb0583d3206e6ba5ae253b9696f538d9b27dc6487185b6293d23a89ce654e013 +size 7377505 diff --git a/4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_gem_xsum_article_DOC_summary_3.jsonl b/4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_gem_xsum_article_DOC_summary_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..a9f6679800b469608c66820fdf39c9070ab549bc --- /dev/null +++ b/4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_gem_xsum_article_DOC_summary_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b6c82d5f552be2d3ed7d498642cb148d10b9ec4b7257186d4143b84caffb726 +size 9646166 diff --git a/4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_gem_xsum_article_DOC_summary_4.jsonl b/4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_gem_xsum_article_DOC_summary_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..c7ca00ef0cdaf16069024d75e9c37583f24358e7 --- /dev/null +++ b/4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_gem_xsum_article_DOC_summary_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a687480776ea4c950663d4f00e9f684a1e53493a65314bd198df64b82f509139 +size 11671916 diff --git a/4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_gem_xsum_article_DOC_summary_5.jsonl b/4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_gem_xsum_article_DOC_summary_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..83443e3220b018f0c8ede69aaffa7aafb8d8e766 --- /dev/null +++ b/4b284b84bc4seed2/evaluation/generation/examples.4b284b84bc4seed2_gem_xsum_article_DOC_summary_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a22e360a1f888b726b5803362a4610dae655a309b4a51fc166786ce82382262e +size 13897513 diff --git a/4b284b84bc4seed2/evaluation/generation/merged.csv b/4b284b84bc4seed2/evaluation/generation/merged.csv new file mode 100644 index 0000000000000000000000000000000000000000..3d87be1440411960252b238030e01ff1861b4c57 --- /dev/null +++ b/4b284b84bc4seed2/evaluation/generation/merged.csv @@ -0,0 +1,53 @@ +dataset,fewshots,prompt,metric,value +e2e_nlg_cleaned,0,generate_text_restaurant,rouge2_fmeasure,0.015238638354519577 +e2e_nlg_cleaned,0,median,rouge2_fmeasure,0.015238638354519577 +e2e_nlg_cleaned,1,generate_text_restaurant,rouge2_fmeasure,0.20120573159323082 +e2e_nlg_cleaned,1,median,rouge2_fmeasure,0.20120573159323082 +e2e_nlg_cleaned,2,generate_text_restaurant,rouge2_fmeasure,0.23204546503817813 +e2e_nlg_cleaned,2,median,rouge2_fmeasure,0.23204546503817813 +e2e_nlg_cleaned,3,generate_text_restaurant,rouge2_fmeasure,0.23558342825678338 +e2e_nlg_cleaned,3,median,rouge2_fmeasure,0.23558342825678338 +e2e_nlg_cleaned,4,generate_text_restaurant,rouge2_fmeasure,0.2285190900484798 +e2e_nlg_cleaned,4,median,rouge2_fmeasure,0.2285190900484798 +e2e_nlg_cleaned,5,generate_text_restaurant,rouge2_fmeasure,0.21699681614941907 +e2e_nlg_cleaned,5,median,rouge2_fmeasure,0.21699681614941907 +e2e_nlg_cleaned,5,average,multiple,0.18826486157343514 +gem_xsum,0,article_DOC_summary,rouge2_fmeasure,0.05119317937818865 +gem_xsum,0,median,rouge2_fmeasure,0.05119317937818865 +gem_xsum,1,article_DOC_summary,rouge2_fmeasure,0.04099230088578755 +gem_xsum,1,median,rouge2_fmeasure,0.04099230088578755 +gem_xsum,2,article_DOC_summary,rouge2_fmeasure,0.04246731521010523 +gem_xsum,2,median,rouge2_fmeasure,0.04246731521010523 +gem_xsum,3,article_DOC_summary,rouge2_fmeasure,0.041996639319967895 +gem_xsum,3,median,rouge2_fmeasure,0.041996639319967895 +gem_xsum,4,article_DOC_summary,rouge2_fmeasure,0.012145091480254444 +gem_xsum,4,median,rouge2_fmeasure,0.012145091480254444 +gem_xsum,5,article_DOC_summary,rouge2_fmeasure,0.0007405035248494208 +gem_xsum,5,median,rouge2_fmeasure,0.0007405035248494208 +gem_xsum,5,average,multiple,0.0315891716331922 +web_nlg_en,0,PALM_prompt,rouge2_fmeasure,0.05201678241725894 +web_nlg_en,0,median,rouge2_fmeasure,0.05201678241725894 +web_nlg_en,1,PALM_prompt,rouge2_fmeasure,0.05396039097370975 +web_nlg_en,1,median,rouge2_fmeasure,0.05396039097370975 +web_nlg_en,2,PALM_prompt,rouge2_fmeasure,0.0542677230188957 +web_nlg_en,2,median,rouge2_fmeasure,0.0542677230188957 +web_nlg_en,3,PALM_prompt,rouge2_fmeasure,0.055174784608656414 +web_nlg_en,3,median,rouge2_fmeasure,0.055174784608656414 +web_nlg_en,4,PALM_prompt,rouge2_fmeasure,0.05617955897318711 +web_nlg_en,4,median,rouge2_fmeasure,0.05617955897318711 +web_nlg_en,5,PALM_prompt,rouge2_fmeasure,0.05625150089671772 +web_nlg_en,5,median,rouge2_fmeasure,0.05625150089671772 +web_nlg_en,5,average,multiple,0.05464179014807094 +wiki_lingua_en,0,tldr_en,rouge2_fmeasure,0.03857873002486118 +wiki_lingua_en,0,median,rouge2_fmeasure,0.03857873002486118 +wiki_lingua_en,1,tldr_en,rouge2_fmeasure,0.05788753426578909 +wiki_lingua_en,1,median,rouge2_fmeasure,0.05788753426578909 +wiki_lingua_en,2,tldr_en,rouge2_fmeasure,0.058940718015282535 +wiki_lingua_en,2,median,rouge2_fmeasure,0.058940718015282535 +wiki_lingua_en,3,tldr_en,rouge2_fmeasure,0.048423081518600516 +wiki_lingua_en,3,median,rouge2_fmeasure,0.048423081518600516 +wiki_lingua_en,4,tldr_en,rouge2_fmeasure,0.014679683423748945 +wiki_lingua_en,4,median,rouge2_fmeasure,0.014679683423748945 +wiki_lingua_en,5,tldr_en,rouge2_fmeasure,0.002426218955168773 +wiki_lingua_en,5,median,rouge2_fmeasure,0.002426218955168773 +wiki_lingua_en,5,average,multiple,0.03682266103390851 diff --git a/4b284b84bc4seed2/evaluation/generation/merged.json b/4b284b84bc4seed2/evaluation/generation/merged.json new file mode 100644 index 0000000000000000000000000000000000000000..2b285be260699eb0cb65a7299b49649f69a70fc9 --- /dev/null +++ b/4b284b84bc4seed2/evaluation/generation/merged.json @@ -0,0 +1 @@ +{"GEM/web_nlg_en": {"0": {"PALM_prompt": {"bleu": 0.3463387125507984, "bleu_stderr": 0.03871898741816671, "rouge1_fmeasure": 0.10952539068797028, "rouge1_fmeasure_stderr": 0.0019907747077539725, "rouge1_precision": 0.07211255715607569, "rouge1_precision_stderr": 0.001551406165163628, "rouge1_recall": 0.2996849092736172, "rouge1_recall_stderr": 0.004583023786340968, "rouge2_fmeasure": 0.05201678241725894, "rouge2_fmeasure_stderr": 0.0012570598168046025, "rouge2_precision": 0.03381420888180137, "rouge2_precision_stderr": 0.0008950985117036589, "rouge2_recall": 0.14844147775806338, "rouge2_recall_stderr": 0.0032200950902031658, "rougeL_fmeasure": 0.10599044553263734, "rougeL_fmeasure_stderr": 0.001858626781810144, "rougeL_precision": 0.06953968025004763, "rougeL_precision_stderr": 0.0014395600092792235, "rougeL_recall": 0.2927861422575508, "rougeL_recall_stderr": 0.004486869628532065, "rougeLsum_fmeasure": 0.10494341774143819, "rougeLsum_fmeasure_stderr": 0.0018712967363079748, "rougeLsum_precision": 0.06905492701097961, "rougeLsum_precision_stderr": 0.0014675622764115906, "rougeLsum_recall": 0.28799521128404415, "rougeLsum_recall_stderr": 0.004338230779660113}}, "1": {"PALM_prompt": {"bleu": 0.49152208622242877, "bleu_stderr": 0.04139408950745415, "rouge1_fmeasure": 0.11542248804126877, "rouge1_fmeasure_stderr": 0.001852315570556662, "rouge1_precision": 0.07373625415642708, "rouge1_precision_stderr": 0.0013444564112333292, "rouge1_recall": 0.3753665468025263, "rouge1_recall_stderr": 0.00536016010380475, "rouge2_fmeasure": 0.05396039097370975, "rouge2_fmeasure_stderr": 0.0011621890988087783, "rouge2_precision": 0.03437112478262944, "rouge2_precision_stderr": 0.0008158271460114628, "rouge2_recall": 0.1839462343866126, "rouge2_recall_stderr": 0.003709671721946962, "rougeL_fmeasure": 0.1080526825836882, "rougeL_fmeasure_stderr": 0.0016391879678756425, "rougeL_precision": 0.06891381858838289, "rougeL_precision_stderr": 0.00117848640155061, "rougeL_recall": 0.3513896637107432, "rougeL_recall_stderr": 0.004856217872136033, "rougeLsum_fmeasure": 0.10983109806282532, "rougeLsum_fmeasure_stderr": 0.0017465824716290605, "rougeLsum_precision": 0.07022268782208652, "rougeLsum_precision_stderr": 0.0012677785220343175, "rougeLsum_recall": 0.3548574219712635, "rougeLsum_recall_stderr": 0.004914558194954389}}, "2": {"PALM_prompt": {"bleu": 0.5036165898830023, "bleu_stderr": 0.03163382931247645, "rouge1_fmeasure": 0.11611735091169018, "rouge1_fmeasure_stderr": 0.0016856649398913782, "rouge1_precision": 0.07345117313274237, "rouge1_precision_stderr": 0.0012208182117261878, "rouge1_recall": 0.3941081050839388, "rouge1_recall_stderr": 0.005139991780948632, "rouge2_fmeasure": 0.0542677230188957, "rouge2_fmeasure_stderr": 0.001076889081745943, "rouge2_precision": 0.03416030472845622, "rouge2_precision_stderr": 0.0007497324529078045, "rouge2_recall": 0.1960695205229479, "rouge2_recall_stderr": 0.00374456566803786, "rougeL_fmeasure": 0.10822818662084129, "rougeL_fmeasure_stderr": 0.0015080010309372358, "rougeL_precision": 0.06848596200566257, "rougeL_precision_stderr": 0.001088456262302762, "rougeL_recall": 0.3641445841455221, "rougeL_recall_stderr": 0.004555374452263096, "rougeLsum_fmeasure": 0.11045227449849929, "rougeLsum_fmeasure_stderr": 0.0015880076943480838, "rougeLsum_precision": 0.06991710191369618, "rougeLsum_precision_stderr": 0.00115124520295404, "rougeLsum_recall": 0.37308280267746685, "rougeLsum_recall_stderr": 0.004752608689239747}}, "3": {"PALM_prompt": {"bleu": 0.6498113531541159, "bleu_stderr": 0.044359939496823625, "rouge1_fmeasure": 0.11670639827568505, "rouge1_fmeasure_stderr": 0.0017228506693859023, "rouge1_precision": 0.07362728433969368, "rouge1_precision_stderr": 0.0012506969519923664, "rouge1_recall": 0.40433747874257164, "rouge1_recall_stderr": 0.00532349382454595, "rouge2_fmeasure": 0.055174784608656414, "rouge2_fmeasure_stderr": 0.001103480731304987, "rouge2_precision": 0.03462285279213432, "rouge2_precision_stderr": 0.0007700688556812641, "rouge2_recall": 0.20446580518938245, "rouge2_recall_stderr": 0.0038704073812126957, "rougeL_fmeasure": 0.10780699471813608, "rougeL_fmeasure_stderr": 0.0015196469475095016, "rougeL_precision": 0.06807883372554288, "rougeL_precision_stderr": 0.0011054577780329877, "rougeL_recall": 0.369498755496309, "rougeL_recall_stderr": 0.004606643368535042, "rougeLsum_fmeasure": 0.11062957727513113, "rougeLsum_fmeasure_stderr": 0.0016229376323127634, "rougeLsum_precision": 0.06987690204692998, "rougeLsum_precision_stderr": 0.001181829372472824, "rougeLsum_recall": 0.38020527679899335, "rougeLsum_recall_stderr": 0.004841997364585111}}, "4": {"PALM_prompt": {"bleu": 0.6676812083161542, "bleu_stderr": 0.04984003951128037, "rouge1_fmeasure": 0.11795519287394977, "rouge1_fmeasure_stderr": 0.001663656872341927, "rouge1_precision": 0.07419859091894718, "rouge1_precision_stderr": 0.0012073720133260548, "rouge1_recall": 0.4115156265704582, "rouge1_recall_stderr": 0.005279248235847037, "rouge2_fmeasure": 0.05617955897318711, "rouge2_fmeasure_stderr": 0.001072962808033341, "rouge2_precision": 0.03509931891578484, "rouge2_precision_stderr": 0.0007461921191218064, "rouge2_recall": 0.21194614881093146, "rouge2_recall_stderr": 0.003942396709196514, "rougeL_fmeasure": 0.10867138834194551, "rougeL_fmeasure_stderr": 0.0014576101979114201, "rougeL_precision": 0.0683956812460672, "rougeL_precision_stderr": 0.0010554662078452836, "rougeL_recall": 0.37604842524473375, "rougeL_recall_stderr": 0.004602132355576208, "rougeLsum_fmeasure": 0.11206081323499055, "rougeLsum_fmeasure_stderr": 0.001572212563142291, "rougeLsum_precision": 0.07053184039179991, "rougeLsum_precision_stderr": 0.0011422521869853676, "rougeLsum_recall": 0.3893450058485989, "rougeLsum_recall_stderr": 0.004865697961495776}}, "5": {"PALM_prompt": {"bleu": 0.7710974467285127, "bleu_stderr": 0.05203704839844347, "rouge1_fmeasure": 0.11877703066041605, "rouge1_fmeasure_stderr": 0.0016491364267747024, "rouge1_precision": 0.07425806182657936, "rouge1_precision_stderr": 0.0011956495019689597, "rouge1_recall": 0.42780274108203253, "rouge1_recall_stderr": 0.005406944243614746, "rouge2_fmeasure": 0.05625150089671772, "rouge2_fmeasure_stderr": 0.0010511709925049085, "rouge2_precision": 0.03492035728514057, "rouge2_precision_stderr": 0.000728989115137721, "rouge2_recall": 0.22003827942872525, "rouge2_recall_stderr": 0.004025013823319427, "rougeL_fmeasure": 0.10772149028740496, "rougeL_fmeasure_stderr": 0.0014157977593889726, "rougeL_precision": 0.06747232289163295, "rougeL_precision_stderr": 0.001034208622107367, "rougeL_recall": 0.3846963659749557, "rougeL_recall_stderr": 0.004603801517001138, "rougeLsum_fmeasure": 0.11204458204469926, "rougeLsum_fmeasure_stderr": 0.0015584717483504628, "rougeLsum_precision": 0.07017346453232838, "rougeLsum_precision_stderr": 0.001136713184580948, "rougeLsum_recall": 0.40087756811378206, "rougeLsum_recall_stderr": 0.004939981502609751}}}, "GEM/wiki_lingua_en": {"0": {"tldr_en": {"bleu": 1.7317879218324492, "bleu_stderr": 0.06258434310865753, "rouge1_fmeasure": 0.18179483366438334, "rouge1_fmeasure_stderr": 0.001918528213130623, "rouge1_precision": 0.15426863660325024, "rouge1_precision_stderr": 0.0019390767016899475, "rouge1_recall": 0.26616584906943935, "rouge1_recall_stderr": 0.002800247123213755, "rouge2_fmeasure": 0.03857873002486118, "rouge2_fmeasure_stderr": 0.0008912625012118423, "rouge2_precision": 0.032398604164030766, "rouge2_precision_stderr": 0.0007853568426710733, "rouge2_recall": 0.059178979799423694, "rouge2_recall_stderr": 0.0015378959605561995, "rougeL_fmeasure": 0.14062571654868716, "rougeL_fmeasure_stderr": 0.0013664451991987955, "rougeL_precision": 0.1178409029648999, "rougeL_precision_stderr": 0.00134426120796486, "rougeL_recall": 0.21156320512029583, "rougeL_recall_stderr": 0.002302858626762558, "rougeLsum_fmeasure": 0.1667428911480839, "rougeLsum_fmeasure_stderr": 0.0017491099585958065, "rougeLsum_precision": 0.14121341341165533, "rougeLsum_precision_stderr": 0.0017607776877685353, "rougeLsum_recall": 0.24535304568196398, "rougeLsum_recall_stderr": 0.0026196185425979572}}, "1": {"tldr_en": {"bleu": 3.078946318578733, "bleu_stderr": 0.037508376634953426, "rouge1_fmeasure": 0.22615743170046998, "rouge1_fmeasure_stderr": 0.0019675759971617946, "rouge1_precision": 0.2097374056236598, "rouge1_precision_stderr": 0.002558792591642619, "rouge1_recall": 0.31993230192333455, "rouge1_recall_stderr": 0.002912578847069188, "rouge2_fmeasure": 0.05788753426578909, "rouge2_fmeasure_stderr": 0.0011036642735696503, "rouge2_precision": 0.05460829335196789, "rouge2_precision_stderr": 0.0013104520035504465, "rouge2_recall": 0.08436597375871419, "rouge2_recall_stderr": 0.0018136264810112849, "rougeL_fmeasure": 0.16096845678834487, "rougeL_fmeasure_stderr": 0.0013344427734486718, "rougeL_precision": 0.14966153212559197, "rougeL_precision_stderr": 0.0019100435840523184, "rougeL_recall": 0.23314632888007986, "rougeL_recall_stderr": 0.002308314606066584, "rougeLsum_fmeasure": 0.21248946284679468, "rougeLsum_fmeasure_stderr": 0.001850444919705845, "rougeLsum_precision": 0.1969300454898004, "rougeLsum_precision_stderr": 0.002419281823679596, "rougeLsum_recall": 0.3015516742807266, "rougeLsum_recall_stderr": 0.0027852344656345953}}, "2": {"tldr_en": {"bleu": 3.331365912474371, "bleu_stderr": 0.03901431585240638, "rouge1_fmeasure": 0.22500809081344597, "rouge1_fmeasure_stderr": 0.0019395777660833832, "rouge1_precision": 0.2249179940170448, "rouge1_precision_stderr": 0.002953091033379103, "rouge1_recall": 0.30791265980488064, "rouge1_recall_stderr": 0.0028052680018540153, "rouge2_fmeasure": 0.058940718015282535, "rouge2_fmeasure_stderr": 0.0011427794692985003, "rouge2_precision": 0.06082816124882105, "rouge2_precision_stderr": 0.0015517487698999066, "rouge2_recall": 0.08191649217784704, "rouge2_recall_stderr": 0.0017207233219242591, "rougeL_fmeasure": 0.1629946491305722, "rougeL_fmeasure_stderr": 0.001412842903446524, "rougeL_precision": 0.1651950475417842, "rougeL_precision_stderr": 0.0023849745375518774, "rougeL_recall": 0.22637843422800283, "rougeL_recall_stderr": 0.002257218203318618, "rougeLsum_fmeasure": 0.21287275166909125, "rougeLsum_fmeasure_stderr": 0.001828524451639913, "rougeLsum_precision": 0.21271781118896244, "rougeLsum_precision_stderr": 0.0027972927699949795, "rougeLsum_recall": 0.29203959550294045, "rougeLsum_recall_stderr": 0.002679740707668158}}, "3": {"tldr_en": {"bleu": 3.4654459013677066, "bleu_stderr": 0.09533106520935124, "rouge1_fmeasure": 0.1828984280612045, "rouge1_fmeasure_stderr": 0.00233789023320496, "rouge1_precision": 0.1984883398198494, "rouge1_precision_stderr": 0.003387900153458854, "rouge1_recall": 0.2444675402553931, "rouge1_recall_stderr": 0.003332060879697036, "rouge2_fmeasure": 0.048423081518600516, "rouge2_fmeasure_stderr": 0.0011278965656492843, "rouge2_precision": 0.05494653639366956, "rouge2_precision_stderr": 0.00172026049377679, "rouge2_recall": 0.06573981524186268, "rouge2_recall_stderr": 0.001646361012922936, "rougeL_fmeasure": 0.13482403873394622, "rougeL_fmeasure_stderr": 0.0017315326993232382, "rougeL_precision": 0.14973545109772782, "rougeL_precision_stderr": 0.002771115067407858, "rougeL_recall": 0.1820828761022503, "rougeL_recall_stderr": 0.002594908370622835, "rougeLsum_fmeasure": 0.1727178547993039, "rougeLsum_fmeasure_stderr": 0.0022030460306759693, "rougeLsum_precision": 0.1876688685476534, "rougeLsum_precision_stderr": 0.003222108012150837, "rougeLsum_recall": 0.23146444735253652, "rougeLsum_recall_stderr": 0.003170383006624478}}, "4": {"tldr_en": {"bleu": 0.5096514625512257, "bleu_stderr": 0.04746911438860582, "rouge1_fmeasure": 0.057249298351433005, "rouge1_fmeasure_stderr": 0.001981710879314234, "rouge1_precision": 0.06373323883393266, "rouge1_precision_stderr": 0.0025948109156841556, "rouge1_recall": 0.07974114305386926, "rouge1_recall_stderr": 0.002852169393376925, "rouge2_fmeasure": 0.014679683423748945, "rouge2_fmeasure_stderr": 0.0007250006064285315, "rouge2_precision": 0.017183606562936146, "rouge2_precision_stderr": 0.001165303674699654, "rouge2_recall": 0.021451383479229473, "rouge2_recall_stderr": 0.00115814797861179, "rougeL_fmeasure": 0.04339902158323832, "rougeL_fmeasure_stderr": 0.0014931210623861644, "rougeL_precision": 0.049676263167134256, "rougeL_precision_stderr": 0.0021317796688731104, "rougeL_recall": 0.061127221909033094, "rougeL_recall_stderr": 0.0022295833532602533, "rougeLsum_fmeasure": 0.05356492994210666, "rougeLsum_fmeasure_stderr": 0.0018539473478258858, "rougeLsum_precision": 0.059918160107108445, "rougeLsum_precision_stderr": 0.002458251392796141, "rougeLsum_recall": 0.07475299437390277, "rougeLsum_recall_stderr": 0.0026852062028548873}}, "5": {"tldr_en": {"bleu": 2.4367817796838913e-07, "bleu_stderr": 5.931740679366216e-07, "rouge1_fmeasure": 0.009381663500620675, "rouge1_fmeasure_stderr": 0.0009033228148794374, "rouge1_precision": 0.00974635222327858, "rouge1_precision_stderr": 0.0010426157804008867, "rouge1_recall": 0.013305767376845547, "rouge1_recall_stderr": 0.001294486365694067, "rouge2_fmeasure": 0.002426218955168773, "rouge2_fmeasure_stderr": 0.00032099513562133, "rouge2_precision": 0.0027541706176161013, "rouge2_precision_stderr": 0.0004991531053543725, "rouge2_recall": 0.0034881657779112446, "rouge2_recall_stderr": 0.0004828260114230198, "rougeL_fmeasure": 0.007132684824681642, "rougeL_fmeasure_stderr": 0.0006849988631397933, "rougeL_precision": 0.007558937884226414, "rougeL_precision_stderr": 0.0008514792129217634, "rougeL_recall": 0.010297022985567691, "rougeL_recall_stderr": 0.0010209752122782392, "rougeLsum_fmeasure": 0.008824412648201954, "rougeLsum_fmeasure_stderr": 0.0008523533756253951, "rougeLsum_precision": 0.00925164902439946, "rougeLsum_precision_stderr": 0.001003429166331945, "rougeLsum_recall": 0.012522528933544396, "rougeLsum_recall_stderr": 0.0012265948088620682}}}, "e2e_nlg_cleaned": {"0": {"generate_text_restaurant": {"bleu": 1.4674593008700727, "bleu_stderr": 0.07690373053792376, "rouge1_fmeasure": 0.06377803506212068, "rouge1_fmeasure_stderr": 0.001672122677396593, "rouge1_precision": 0.05683753991737235, "rouge1_precision_stderr": 0.0014560506575201325, "rouge1_recall": 0.08937391024861521, "rouge1_recall_stderr": 0.002366915901253559, "rouge2_fmeasure": 0.015238638354519577, "rouge2_fmeasure_stderr": 0.0007071169872858592, "rouge2_precision": 0.012214590726895359, "rouge2_precision_stderr": 0.0005743247716736654, "rouge2_recall": 0.021379218732414145, "rouge2_recall_stderr": 0.0009966104546792834, "rougeL_fmeasure": 0.059880641876164487, "rougeL_fmeasure_stderr": 0.0014895688210922907, "rougeL_precision": 0.05347894988195794, "rougeL_precision_stderr": 0.0013049823564136975, "rougeL_recall": 0.08437384990508254, "rougeL_recall_stderr": 0.0021538312776559535, "rougeLsum_fmeasure": 0.057561121270217515, "rougeLsum_fmeasure_stderr": 0.0014995174600948955, "rougeLsum_precision": 0.05199652967109443, "rougeLsum_precision_stderr": 0.001336335232731129, "rougeLsum_recall": 0.08011650518165435, "rougeLsum_recall_stderr": 0.0021036901960562}}, "1": {"generate_text_restaurant": {"bleu": 11.256639255609565, "bleu_stderr": 0.13909119146023038, "rouge1_fmeasure": 0.43826153885312474, "rouge1_fmeasure_stderr": 0.0023680361634807615, "rouge1_precision": 0.5241369762469382, "rouge1_precision_stderr": 0.0032402613188758484, "rouge1_recall": 0.4154073794853628, "rouge1_recall_stderr": 0.0029811452241909936, "rouge2_fmeasure": 0.20120573159323082, "rouge2_fmeasure_stderr": 0.0019466830589320579, "rouge2_precision": 0.24440729108549972, "rouge2_precision_stderr": 0.0025713353876726987, "rouge2_recall": 0.1903569141394937, "rouge2_recall_stderr": 0.002085369890907639, "rougeL_fmeasure": 0.31512942959617346, "rougeL_fmeasure_stderr": 0.0020245073951865498, "rougeL_precision": 0.3797441094381383, "rougeL_precision_stderr": 0.002849422577384458, "rougeL_recall": 0.2977661478395331, "rougeL_recall_stderr": 0.0023832352149522175, "rougeLsum_fmeasure": 0.35586936216582027, "rougeLsum_fmeasure_stderr": 0.002288936359442796, "rougeLsum_precision": 0.4269573872984081, "rougeLsum_precision_stderr": 0.003094947485413177, "rougeLsum_recall": 0.33674441043750625, "rougeLsum_recall_stderr": 0.00269773822444997}}, "2": {"generate_text_restaurant": {"bleu": 13.376126264980714, "bleu_stderr": 0.2423138700015996, "rouge1_fmeasure": 0.47582339525157197, "rouge1_fmeasure_stderr": 0.0022765247887398116, "rouge1_precision": 0.5586896631262273, "rouge1_precision_stderr": 0.0032542273894082263, "rouge1_recall": 0.4534492320208494, "rouge1_recall_stderr": 0.0029116157123098745, "rouge2_fmeasure": 0.23204546503817813, "rouge2_fmeasure_stderr": 0.002046713809774589, "rouge2_precision": 0.27694841097623996, "rouge2_precision_stderr": 0.002758389324353955, "rouge2_recall": 0.2206909261465891, "rouge2_recall_stderr": 0.0021891415728379693, "rougeL_fmeasure": 0.34446258237680916, "rougeL_fmeasure_stderr": 0.0020760578430186376, "rougeL_precision": 0.40753042690914904, "rougeL_precision_stderr": 0.002988569615037221, "rougeL_recall": 0.3271426648953936, "rougeL_recall_stderr": 0.002412434421850288, "rougeLsum_fmeasure": 0.39054726501758946, "rougeLsum_fmeasure_stderr": 0.002301771792227363, "rougeLsum_precision": 0.4602485572678633, "rougeLsum_precision_stderr": 0.003204122515744201, "rougeLsum_recall": 0.3712619134780482, "rougeLsum_recall_stderr": 0.0026876195742092054}}, "3": {"generate_text_restaurant": {"bleu": 14.093165522897872, "bleu_stderr": 0.21216386354546166, "rouge1_fmeasure": 0.4785676515677228, "rouge1_fmeasure_stderr": 0.0022234504082830633, "rouge1_precision": 0.5387233761250629, "rouge1_precision_stderr": 0.0031864759527455624, "rouge1_recall": 0.4726895100996329, "rouge1_recall_stderr": 0.002899854544961585, "rouge2_fmeasure": 0.23558342825678338, "rouge2_fmeasure_stderr": 0.002030621156209231, "rouge2_precision": 0.2685393636176561, "rouge2_precision_stderr": 0.0026170967343239477, "rouge2_recall": 0.23277587897646693, "rouge2_recall_stderr": 0.0022527763377626336, "rougeL_fmeasure": 0.34641516486003826, "rougeL_fmeasure_stderr": 0.0020831944107613303, "rougeL_precision": 0.39161805848668024, "rougeL_precision_stderr": 0.002876699759638117, "rougeL_recall": 0.34175514874890695, "rougeL_recall_stderr": 0.0024862399492205957, "rougeLsum_fmeasure": 0.3965640250353348, "rougeLsum_fmeasure_stderr": 0.0022751928578861502, "rougeLsum_precision": 0.44704833712523245, "rougeLsum_precision_stderr": 0.003092169155791799, "rougeLsum_recall": 0.3913487563855888, "rougeLsum_recall_stderr": 0.0027430209943532587}}, "4": {"generate_text_restaurant": {"bleu": 13.01877522701202, "bleu_stderr": 0.1634606411416184, "rouge1_fmeasure": 0.47017887879088466, "rouge1_fmeasure_stderr": 0.00215775715520141, "rouge1_precision": 0.4967367435501768, "rouge1_precision_stderr": 0.002997180519517344, "rouge1_recall": 0.48986433299719573, "rouge1_recall_stderr": 0.0028919527625229664, "rouge2_fmeasure": 0.2285190900484798, "rouge2_fmeasure_stderr": 0.001968236514909628, "rouge2_precision": 0.24350630882815852, "rouge2_precision_stderr": 0.002422719426969184, "rouge2_recall": 0.2387594057692899, "rouge2_recall_stderr": 0.0022672859667634986, "rougeL_fmeasure": 0.3311043111563345, "rougeL_fmeasure_stderr": 0.001975651372330419, "rougeL_precision": 0.3508199102140834, "rougeL_precision_stderr": 0.002597964369996749, "rougeL_recall": 0.34517696947416515, "rougeL_recall_stderr": 0.0024767421656897485, "rougeLsum_fmeasure": 0.3879654204025311, "rougeLsum_fmeasure_stderr": 0.00222102600090257, "rougeLsum_precision": 0.4096834114721446, "rougeLsum_precision_stderr": 0.0028584575443569072, "rougeLsum_recall": 0.4045460483730194, "rougeLsum_recall_stderr": 0.002787010565242438}}, "5": {"generate_text_restaurant": {"bleu": 11.738533814250154, "bleu_stderr": 0.20692029359403782, "rouge1_fmeasure": 0.4579176439966838, "rouge1_fmeasure_stderr": 0.0019838649103218315, "rouge1_precision": 0.4557324007548413, "rouge1_precision_stderr": 0.0026141133736043063, "rouge1_recall": 0.5008190200746241, "rouge1_recall_stderr": 0.0027912701451645113, "rouge2_fmeasure": 0.21699681614941907, "rouge2_fmeasure_stderr": 0.0018260134934355917, "rouge2_precision": 0.21649241809836905, "rouge2_precision_stderr": 0.0020808047468387015, "rouge2_recall": 0.23946332773224333, "rouge2_recall_stderr": 0.0022622492821207474, "rougeL_fmeasure": 0.3204737144833669, "rougeL_fmeasure_stderr": 0.0018416039122686005, "rougeL_precision": 0.31896738977233224, "rougeL_precision_stderr": 0.002249879972490852, "rougeL_recall": 0.3516931047967278, "rougeL_recall_stderr": 0.0024669281840779384, "rougeLsum_fmeasure": 0.38110492282903374, "rougeLsum_fmeasure_stderr": 0.0020518013347156708, "rougeLsum_precision": 0.3790705627204969, "rougeLsum_precision_stderr": 0.0024962460456464603, "rougeLsum_recall": 0.4171792042608784, "rougeLsum_recall_stderr": 0.0027157128707540365}}}, "gem_xsum": {"0": {"article_DOC_summary": {"bleu": 2.2151365071026334, "bleu_stderr": 0.10551243625041298, "rouge1_fmeasure": 0.2173222672616331, "rouge1_fmeasure_stderr": 0.0026735963951633086, "rouge1_precision": 0.17320559498489507, "rouge1_precision_stderr": 0.0025525024097035748, "rouge1_recall": 0.33568511811329627, "rouge1_recall_stderr": 0.004457272030335943, "rouge2_fmeasure": 0.05119317937818865, "rouge2_fmeasure_stderr": 0.0016915277669349944, "rouge2_precision": 0.03984347722138949, "rouge2_precision_stderr": 0.0014498730660041778, "rouge2_recall": 0.08293611853648174, "rouge2_recall_stderr": 0.0027922604769135967, "rougeL_fmeasure": 0.16413944160730887, "rougeL_fmeasure_stderr": 0.0020492207241516436, "rougeL_precision": 0.1306308027797899, "rougeL_precision_stderr": 0.001979750535716133, "rougeL_recall": 0.25481924486600754, "rougeL_recall_stderr": 0.0034477504419509046, "rougeLsum_fmeasure": 0.17170031392993537, "rougeLsum_fmeasure_stderr": 0.002265881556419863, "rougeLsum_precision": 0.13618964667417757, "rougeLsum_precision_stderr": 0.0020883754136888665, "rougeLsum_recall": 0.2671983620973551, "rougeLsum_recall_stderr": 0.0038518682770408703}}, "1": {"article_DOC_summary": {"bleu": 1.5874448429909755, "bleu_stderr": 0.07657449929611179, "rouge1_fmeasure": 0.18543200867192464, "rouge1_fmeasure_stderr": 0.0024553301715842025, "rouge1_precision": 0.13193321373947423, "rouge1_precision_stderr": 0.0018249214408045705, "rouge1_recall": 0.32491663088067385, "rouge1_recall_stderr": 0.004280533648795701, "rouge2_fmeasure": 0.04099230088578755, "rouge2_fmeasure_stderr": 0.0014846354986486204, "rouge2_precision": 0.02885078338766851, "rouge2_precision_stderr": 0.0010494871344340587, "rouge2_recall": 0.07423283049608298, "rouge2_recall_stderr": 0.0027810291758957346, "rougeL_fmeasure": 0.14626844109613504, "rougeL_fmeasure_stderr": 0.0018773361178004498, "rougeL_precision": 0.10387006177524372, "rougeL_precision_stderr": 0.0013802990359211345, "rougeL_recall": 0.2578619666146113, "rougeL_recall_stderr": 0.003428735324171146, "rougeLsum_fmeasure": 0.1472004999527075, "rougeLsum_fmeasure_stderr": 0.0020688083081768726, "rougeLsum_precision": 0.10445447840702451, "rougeLsum_precision_stderr": 0.001509990224349501, "rougeLsum_recall": 0.2598290086664842, "rougeLsum_recall_stderr": 0.0037495698358454184}}, "2": {"article_DOC_summary": {"bleu": 1.620400084032387, "bleu_stderr": 0.1036187597036037, "rouge1_fmeasure": 0.18753394533546663, "rouge1_fmeasure_stderr": 0.0024632687591213827, "rouge1_precision": 0.13378369552141486, "rouge1_precision_stderr": 0.001828879330748606, "rouge1_recall": 0.32737811206091777, "rouge1_recall_stderr": 0.004306408194620798, "rouge2_fmeasure": 0.04246731521010523, "rouge2_fmeasure_stderr": 0.0014710047875479853, "rouge2_precision": 0.0299925935097244, "rouge2_precision_stderr": 0.0010381433997656876, "rouge2_recall": 0.07593086345843493, "rouge2_recall_stderr": 0.0027442526221015794, "rougeL_fmeasure": 0.14937612301640457, "rougeL_fmeasure_stderr": 0.0018862901936057773, "rougeL_precision": 0.10643964494355733, "rougeL_precision_stderr": 0.0013938532111114862, "rougeL_recall": 0.26198866539949395, "rougeL_recall_stderr": 0.0034185812335638674, "rougeLsum_fmeasure": 0.14706588908674015, "rougeLsum_fmeasure_stderr": 0.0020537944843788485, "rougeLsum_precision": 0.10465900735165316, "rougeLsum_precision_stderr": 0.0014985247658685268, "rougeLsum_recall": 0.25870432987334707, "rougeLsum_recall_stderr": 0.0037543234582558148}}, "3": {"article_DOC_summary": {"bleu": 1.6556986327135799, "bleu_stderr": 0.09408085446538644, "rouge1_fmeasure": 0.181742673631377, "rouge1_fmeasure_stderr": 0.0026996346996907114, "rouge1_precision": 0.1325857147512653, "rouge1_precision_stderr": 0.002104582538451698, "rouge1_recall": 0.310270163693354, "rouge1_recall_stderr": 0.004622235270535744, "rouge2_fmeasure": 0.041996639319967895, "rouge2_fmeasure_stderr": 0.0014924431333982891, "rouge2_precision": 0.030071518934551324, "rouge2_precision_stderr": 0.0010760225740262315, "rouge2_recall": 0.07399993568063115, "rouge2_recall_stderr": 0.0027512935104685335, "rougeL_fmeasure": 0.1455139114170652, "rougeL_fmeasure_stderr": 0.002103135242813012, "rougeL_precision": 0.10572519383258887, "rougeL_precision_stderr": 0.001594887821630211, "rougeL_recall": 0.24999311515441475, "rougeL_recall_stderr": 0.0037295235353239403, "rougeLsum_fmeasure": 0.1443734491656482, "rougeLsum_fmeasure_stderr": 0.002242271836640455, "rougeLsum_precision": 0.10501603221104056, "rougeLsum_precision_stderr": 0.0017119294258030526, "rougeLsum_recall": 0.24836824871710267, "rougeLsum_recall_stderr": 0.003968401031348439}}, "4": {"article_DOC_summary": {"bleu": 0.8787323538547989, "bleu_stderr": 0.09806037997681721, "rouge1_fmeasure": 0.051203664083526064, "rouge1_fmeasure_stderr": 0.002916215578123627, "rouge1_precision": 0.04185793101612411, "rouge1_precision_stderr": 0.0025354871639657332, "rouge1_recall": 0.07960189442566881, "rouge1_recall_stderr": 0.004594099676529609, "rouge2_fmeasure": 0.012145091480254444, "rouge2_fmeasure_stderr": 0.001038605071999789, "rouge2_precision": 0.009545271254314988, "rouge2_precision_stderr": 0.0009027168872299666, "rouge2_recall": 0.019489192736000506, "rouge2_recall_stderr": 0.0016525733661952122, "rougeL_fmeasure": 0.040479741202891835, "rougeL_fmeasure_stderr": 0.0022777830898179745, "rougeL_precision": 0.03331696824804232, "rougeL_precision_stderr": 0.002048247078605598, "rougeL_recall": 0.06320111546579645, "rougeL_recall_stderr": 0.0036120398264049094, "rougeLsum_fmeasure": 0.041001723419299384, "rougeLsum_fmeasure_stderr": 0.0023481586557545764, "rougeLsum_precision": 0.033884182850020796, "rougeLsum_precision_stderr": 0.0021113829994884406, "rougeLsum_recall": 0.0637408678817515, "rougeLsum_recall_stderr": 0.003715585442877857}}, "5": {"article_DOC_summary": {"bleu": 6.480764426251045e-36, "bleu_stderr": 1.6529080147588964e-30, "rouge1_fmeasure": 0.003279934928320664, "rouge1_fmeasure_stderr": 0.0009428534366320934, "rouge1_precision": 0.003661405957465891, "rouge1_precision_stderr": 0.0010410174134967514, "rouge1_recall": 0.003073378808572809, "rouge1_recall_stderr": 0.0008998604189966408, "rouge2_fmeasure": 0.0007405035248494208, "rouge2_fmeasure_stderr": 0.00038311030521319677, "rouge2_precision": 0.0007725002522449804, "rouge2_precision_stderr": 0.0003775496435431225, "rouge2_recall": 0.0007322912012146197, "rouge2_recall_stderr": 0.0003972475356359937, "rougeL_fmeasure": 0.0021896510504014074, "rougeL_fmeasure_stderr": 0.0006251341441438973, "rougeL_precision": 0.002439909640242604, "rougeL_precision_stderr": 0.0006917842321148266, "rougeL_recall": 0.0020657262287064482, "rougeL_recall_stderr": 0.000601437175466453, "rougeLsum_fmeasure": 0.0026863003460885, "rougeLsum_fmeasure_stderr": 0.0007784026207598828, "rougeLsum_precision": 0.0030026261505173824, "rougeLsum_precision_stderr": 0.0008643214712623419, "rougeLsum_recall": 0.002523952641616138, "rougeLsum_recall_stderr": 0.0007458033281437961}}}} \ No newline at end of file diff --git a/4b284b84bc4seed2/evaluation/generation/slim.4b284b84bc4seed2_GEM-web_nlg_en_PALM_prompt_0.json b/4b284b84bc4seed2/evaluation/generation/slim.4b284b84bc4seed2_GEM-web_nlg_en_PALM_prompt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..712ece6c18c23cde1089eed91b85ac40c42ee0b7 --- /dev/null +++ b/4b284b84bc4seed2/evaluation/generation/slim.4b284b84bc4seed2_GEM-web_nlg_en_PALM_prompt_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.3463387125507984, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.03871898741816671 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07211255715607569, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.001551406165163628 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.2996849092736172, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.004583023786340968 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.10952539068797028, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0019907747077539725 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03381420888180137, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0008950985117036589 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.14844147775806338, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0032200950902031658 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.05201678241725894, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0012570598168046025 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.06953968025004763, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0014395600092792235 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.2927861422575508, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004486869628532065 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.10599044553263734, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.001858626781810144 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.06905492701097961, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0014675622764115906 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.28799521128404415, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004338230779660113 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.10494341774143819, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0018712967363079748 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed2/evaluation/generation/slim.4b284b84bc4seed2_GEM-web_nlg_en_PALM_prompt_1.json b/4b284b84bc4seed2/evaluation/generation/slim.4b284b84bc4seed2_GEM-web_nlg_en_PALM_prompt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..f58c5cf4f9951a59cfbe5e8b03693043e477889a --- /dev/null +++ b/4b284b84bc4seed2/evaluation/generation/slim.4b284b84bc4seed2_GEM-web_nlg_en_PALM_prompt_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.49152208622242877, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.04139408950745415 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07373625415642708, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0013444564112333292 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.3753665468025263, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.00536016010380475 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.11542248804126877, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.001852315570556662 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03437112478262944, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0008158271460114628 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.1839462343866126, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003709671721946962 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.05396039097370975, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0011621890988087783 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.06891381858838289, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.00117848640155061 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.3513896637107432, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004856217872136033 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.1080526825836882, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0016391879678756425 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.07022268782208652, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0012677785220343175 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.3548574219712635, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004914558194954389 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.10983109806282532, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0017465824716290605 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed2/evaluation/generation/slim.4b284b84bc4seed2_GEM-web_nlg_en_PALM_prompt_2.json b/4b284b84bc4seed2/evaluation/generation/slim.4b284b84bc4seed2_GEM-web_nlg_en_PALM_prompt_2.json new file mode 100644 index 0000000000000000000000000000000000000000..e7384e006b308a782034997bbd6da3a3661b480e --- /dev/null +++ b/4b284b84bc4seed2/evaluation/generation/slim.4b284b84bc4seed2_GEM-web_nlg_en_PALM_prompt_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.5036165898830023, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.03163382931247645 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07345117313274237, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0012208182117261878 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.3941081050839388, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005139991780948632 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.11611735091169018, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0016856649398913782 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03416030472845622, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007497324529078045 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.1960695205229479, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.00374456566803786 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.0542677230188957, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.001076889081745943 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.06848596200566257, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.001088456262302762 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.3641445841455221, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004555374452263096 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.10822818662084129, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0015080010309372358 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.06991710191369618, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.00115124520295404 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.37308280267746685, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004752608689239747 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.11045227449849929, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0015880076943480838 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed2/evaluation/generation/slim.4b284b84bc4seed2_GEM-web_nlg_en_PALM_prompt_3.json b/4b284b84bc4seed2/evaluation/generation/slim.4b284b84bc4seed2_GEM-web_nlg_en_PALM_prompt_3.json new file mode 100644 index 0000000000000000000000000000000000000000..5a256f7626f3d5867ff7878238afa3b4797478b0 --- /dev/null +++ b/4b284b84bc4seed2/evaluation/generation/slim.4b284b84bc4seed2_GEM-web_nlg_en_PALM_prompt_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.6498113531541159, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.044359939496823625 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07362728433969368, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0012506969519923664 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.40433747874257164, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.00532349382454595 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.11670639827568505, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0017228506693859023 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03462285279213432, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007700688556812641 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.20446580518938245, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0038704073812126957 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.055174784608656414, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.001103480731304987 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.06807883372554288, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0011054577780329877 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.369498755496309, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004606643368535042 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.10780699471813608, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0015196469475095016 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.06987690204692998, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.001181829372472824 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.38020527679899335, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004841997364585111 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.11062957727513113, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0016229376323127634 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed2/evaluation/generation/slim.4b284b84bc4seed2_GEM-web_nlg_en_PALM_prompt_4.json b/4b284b84bc4seed2/evaluation/generation/slim.4b284b84bc4seed2_GEM-web_nlg_en_PALM_prompt_4.json new file mode 100644 index 0000000000000000000000000000000000000000..fba2d3f551e69e7efc2dfea42014f488ca67d82a --- /dev/null +++ b/4b284b84bc4seed2/evaluation/generation/slim.4b284b84bc4seed2_GEM-web_nlg_en_PALM_prompt_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.6676812083161542, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.04984003951128037 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07419859091894718, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0012073720133260548 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.4115156265704582, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005279248235847037 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.11795519287394977, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.001663656872341927 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03509931891578484, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007461921191218064 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.21194614881093146, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003942396709196514 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.05617955897318711, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.001072962808033341 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.0683956812460672, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0010554662078452836 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.37604842524473375, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004602132355576208 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.10867138834194551, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0014576101979114201 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.07053184039179991, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0011422521869853676 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.3893450058485989, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004865697961495776 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.11206081323499055, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.001572212563142291 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed2/evaluation/generation/slim.4b284b84bc4seed2_GEM-web_nlg_en_PALM_prompt_5.json b/4b284b84bc4seed2/evaluation/generation/slim.4b284b84bc4seed2_GEM-web_nlg_en_PALM_prompt_5.json new file mode 100644 index 0000000000000000000000000000000000000000..4dedf463de73ab0cfe0cdd8e33322cb407972b80 --- /dev/null +++ b/4b284b84bc4seed2/evaluation/generation/slim.4b284b84bc4seed2_GEM-web_nlg_en_PALM_prompt_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.7710974467285127, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.05203704839844347 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07425806182657936, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0011956495019689597 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.42780274108203253, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005406944243614746 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.11877703066041605, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0016491364267747024 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03492035728514057, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.000728989115137721 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.22003827942872525, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.004025013823319427 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.05625150089671772, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0010511709925049085 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.06747232289163295, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.001034208622107367 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.3846963659749557, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004603801517001138 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.10772149028740496, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0014157977593889726 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.07017346453232838, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.001136713184580948 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.40087756811378206, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004939981502609751 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.11204458204469926, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0015584717483504628 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed2/evaluation/generation/slim.4b284b84bc4seed2_GEM-wiki_lingua_en_tldr_en_0.json b/4b284b84bc4seed2/evaluation/generation/slim.4b284b84bc4seed2_GEM-wiki_lingua_en_tldr_en_0.json new file mode 100644 index 0000000000000000000000000000000000000000..e4b33d3f14ed9ca7934586521b82337a947a4359 --- /dev/null +++ b/4b284b84bc4seed2/evaluation/generation/slim.4b284b84bc4seed2_GEM-wiki_lingua_en_tldr_en_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.15426863660325024, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0019390767016899475 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.26616584906943935, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.002800247123213755 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.18179483366438334, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.001918528213130623 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.032398604164030766, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007853568426710733 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.059178979799423694, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0015378959605561995 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.03857873002486118, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0008912625012118423 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.1178409029648999, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.00134426120796486 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.21156320512029583, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.002302858626762558 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.14062571654868716, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0013664451991987955 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.14121341341165533, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0017607776877685353 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.24535304568196398, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0026196185425979572 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.1667428911480839, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0017491099585958065 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 1.7317879218324492, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.06258434310865753 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed2/evaluation/generation/slim.4b284b84bc4seed2_GEM-wiki_lingua_en_tldr_en_1.json b/4b284b84bc4seed2/evaluation/generation/slim.4b284b84bc4seed2_GEM-wiki_lingua_en_tldr_en_1.json new file mode 100644 index 0000000000000000000000000000000000000000..860737b04fd4a0e85c12bebe0ce1f0a6ff0f5242 --- /dev/null +++ b/4b284b84bc4seed2/evaluation/generation/slim.4b284b84bc4seed2_GEM-wiki_lingua_en_tldr_en_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.2097374056236598, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.002558792591642619 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.31993230192333455, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.002912578847069188 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.22615743170046998, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0019675759971617946 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.05460829335196789, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0013104520035504465 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.08436597375871419, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0018136264810112849 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.05788753426578909, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0011036642735696503 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.14966153212559197, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0019100435840523184 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.23314632888007986, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.002308314606066584 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.16096845678834487, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0013344427734486718 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.1969300454898004, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.002419281823679596 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.3015516742807266, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0027852344656345953 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.21248946284679468, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.001850444919705845 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 3.078946318578733, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.037508376634953426 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed2/evaluation/generation/slim.4b284b84bc4seed2_GEM-wiki_lingua_en_tldr_en_2.json b/4b284b84bc4seed2/evaluation/generation/slim.4b284b84bc4seed2_GEM-wiki_lingua_en_tldr_en_2.json new file mode 100644 index 0000000000000000000000000000000000000000..da324ca68b1d716a2adf16145e2b57116fcb0e8f --- /dev/null +++ b/4b284b84bc4seed2/evaluation/generation/slim.4b284b84bc4seed2_GEM-wiki_lingua_en_tldr_en_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.2249179940170448, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.002953091033379103 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.30791265980488064, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0028052680018540153 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.22500809081344597, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0019395777660833832 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.06082816124882105, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0015517487698999066 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.08191649217784704, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0017207233219242591 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.058940718015282535, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0011427794692985003 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.1651950475417842, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0023849745375518774 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.22637843422800283, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.002257218203318618 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.1629946491305722, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.001412842903446524 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.21271781118896244, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0027972927699949795 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.29203959550294045, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.002679740707668158 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.21287275166909125, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.001828524451639913 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 3.331365912474371, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.03901431585240638 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed2/evaluation/generation/slim.4b284b84bc4seed2_GEM-wiki_lingua_en_tldr_en_3.json b/4b284b84bc4seed2/evaluation/generation/slim.4b284b84bc4seed2_GEM-wiki_lingua_en_tldr_en_3.json new file mode 100644 index 0000000000000000000000000000000000000000..6ec10c473a68feabfe2ff4e65e105bf9547084a9 --- /dev/null +++ b/4b284b84bc4seed2/evaluation/generation/slim.4b284b84bc4seed2_GEM-wiki_lingua_en_tldr_en_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.1984883398198494, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.003387900153458854 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.2444675402553931, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.003332060879697036 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.1828984280612045, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.00233789023320496 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.05494653639366956, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.00172026049377679 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.06573981524186268, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.001646361012922936 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.048423081518600516, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0011278965656492843 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.14973545109772782, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.002771115067407858 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.1820828761022503, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.002594908370622835 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.13482403873394622, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0017315326993232382 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.1876688685476534, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.003222108012150837 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.23146444735253652, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.003170383006624478 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.1727178547993039, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0022030460306759693 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 3.4654459013677066, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.09533106520935124 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed2/evaluation/generation/slim.4b284b84bc4seed2_GEM-wiki_lingua_en_tldr_en_4.json b/4b284b84bc4seed2/evaluation/generation/slim.4b284b84bc4seed2_GEM-wiki_lingua_en_tldr_en_4.json new file mode 100644 index 0000000000000000000000000000000000000000..d7042dd6f5a08d45a5ddd679ec5e2080e845e0b5 --- /dev/null +++ b/4b284b84bc4seed2/evaluation/generation/slim.4b284b84bc4seed2_GEM-wiki_lingua_en_tldr_en_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.06373323883393266, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0025948109156841556 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.07974114305386926, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.002852169393376925 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.057249298351433005, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.001981710879314234 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.017183606562936146, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.001165303674699654 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.021451383479229473, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.00115814797861179 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.014679683423748945, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0007250006064285315 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.049676263167134256, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0021317796688731104 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.061127221909033094, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0022295833532602533 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.04339902158323832, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0014931210623861644 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.059918160107108445, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.002458251392796141 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.07475299437390277, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0026852062028548873 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.05356492994210666, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0018539473478258858 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 0.5096514625512257, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.04746911438860582 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed2/evaluation/generation/slim.4b284b84bc4seed2_GEM-wiki_lingua_en_tldr_en_5.json b/4b284b84bc4seed2/evaluation/generation/slim.4b284b84bc4seed2_GEM-wiki_lingua_en_tldr_en_5.json new file mode 100644 index 0000000000000000000000000000000000000000..088ddebe0732961c7c380e99d2b3c5b5e012cdaa --- /dev/null +++ b/4b284b84bc4seed2/evaluation/generation/slim.4b284b84bc4seed2_GEM-wiki_lingua_en_tldr_en_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.00974635222327858, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0010426157804008867 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.013305767376845547, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.001294486365694067 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.009381663500620675, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0009033228148794374 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.0027541706176161013, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0004991531053543725 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.0034881657779112446, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0004828260114230198 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.002426218955168773, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.00032099513562133 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.007558937884226414, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0008514792129217634 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.010297022985567691, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0010209752122782392 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.007132684824681642, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0006849988631397933 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.00925164902439946, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.001003429166331945 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.012522528933544396, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0012265948088620682 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.008824412648201954, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0008523533756253951 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 2.4367817796838913e-07, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 5.931740679366216e-07 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed2/evaluation/generation/slim.4b284b84bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_0.json b/4b284b84bc4seed2/evaluation/generation/slim.4b284b84bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..a35533db685ca9f2cf8ada8354f3a624e02b004f --- /dev/null +++ b/4b284b84bc4seed2/evaluation/generation/slim.4b284b84bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 1.4674593008700727, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.07690373053792376 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.05683753991737235, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0014560506575201325 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.08937391024861521, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.002366915901253559 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.06377803506212068, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.001672122677396593 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.012214590726895359, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0005743247716736654 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.021379218732414145, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0009966104546792834 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.015238638354519577, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0007071169872858592 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.05347894988195794, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0013049823564136975 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.08437384990508254, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0021538312776559535 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.059880641876164487, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0014895688210922907 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.05199652967109443, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.001336335232731129 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.08011650518165435, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0021036901960562 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.057561121270217515, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0014995174600948955 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed2/evaluation/generation/slim.4b284b84bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_1.json b/4b284b84bc4seed2/evaluation/generation/slim.4b284b84bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_1.json new file mode 100644 index 0000000000000000000000000000000000000000..0f50861aa3489e62a3b4e02655effc70d1b1383f --- /dev/null +++ b/4b284b84bc4seed2/evaluation/generation/slim.4b284b84bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 11.256639255609565, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.13909119146023038 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.5241369762469382, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0032402613188758484 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4154073794853628, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0029811452241909936 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.43826153885312474, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0023680361634807615 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.24440729108549972, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0025713353876726987 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.1903569141394937, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.002085369890907639 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.20120573159323082, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0019466830589320579 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.3797441094381383, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.002849422577384458 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.2977661478395331, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0023832352149522175 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.31512942959617346, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0020245073951865498 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.4269573872984081, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.003094947485413177 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.33674441043750625, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.00269773822444997 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.35586936216582027, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.002288936359442796 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed2/evaluation/generation/slim.4b284b84bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_2.json b/4b284b84bc4seed2/evaluation/generation/slim.4b284b84bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_2.json new file mode 100644 index 0000000000000000000000000000000000000000..15b2ed93cd32217ac4e0975dec1e9f871be34919 --- /dev/null +++ b/4b284b84bc4seed2/evaluation/generation/slim.4b284b84bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 13.376126264980714, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.2423138700015996 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.5586896631262273, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0032542273894082263 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4534492320208494, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0029116157123098745 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.47582339525157197, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0022765247887398116 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.27694841097623996, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.002758389324353955 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.2206909261465891, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0021891415728379693 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.23204546503817813, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.002046713809774589 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.40753042690914904, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.002988569615037221 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3271426648953936, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.002412434421850288 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.34446258237680916, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0020760578430186376 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.4602485572678633, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.003204122515744201 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3712619134780482, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0026876195742092054 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.39054726501758946, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.002301771792227363 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed2/evaluation/generation/slim.4b284b84bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_3.json b/4b284b84bc4seed2/evaluation/generation/slim.4b284b84bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_3.json new file mode 100644 index 0000000000000000000000000000000000000000..969eef8d5ab72880b596fbd699c4c57fdac54b4f --- /dev/null +++ b/4b284b84bc4seed2/evaluation/generation/slim.4b284b84bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 14.093165522897872, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.21216386354546166 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.5387233761250629, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0031864759527455624 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4726895100996329, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.002899854544961585 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.4785676515677228, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0022234504082830633 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.2685393636176561, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0026170967343239477 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.23277587897646693, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0022527763377626336 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.23558342825678338, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.002030621156209231 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.39161805848668024, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.002876699759638117 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.34175514874890695, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0024862399492205957 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.34641516486003826, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0020831944107613303 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.44704833712523245, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.003092169155791799 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3913487563855888, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0027430209943532587 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.3965640250353348, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0022751928578861502 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed2/evaluation/generation/slim.4b284b84bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_4.json b/4b284b84bc4seed2/evaluation/generation/slim.4b284b84bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_4.json new file mode 100644 index 0000000000000000000000000000000000000000..248481a4833cac302fc90996853f3c89c4e3d456 --- /dev/null +++ b/4b284b84bc4seed2/evaluation/generation/slim.4b284b84bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 13.01877522701202, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.1634606411416184 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.4967367435501768, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.002997180519517344 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.48986433299719573, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0028919527625229664 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.47017887879088466, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.00215775715520141 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.24350630882815852, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.002422719426969184 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.2387594057692899, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0022672859667634986 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.2285190900484798, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.001968236514909628 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.3508199102140834, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.002597964369996749 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.34517696947416515, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0024767421656897485 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.3311043111563345, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.001975651372330419 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.4096834114721446, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0028584575443569072 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.4045460483730194, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002787010565242438 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.3879654204025311, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.00222102600090257 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed2/evaluation/generation/slim.4b284b84bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_5.json b/4b284b84bc4seed2/evaluation/generation/slim.4b284b84bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_5.json new file mode 100644 index 0000000000000000000000000000000000000000..b523aebce75e32ec63df615f493c96e593c40816 --- /dev/null +++ b/4b284b84bc4seed2/evaluation/generation/slim.4b284b84bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 11.738533814250154, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.20692029359403782 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.4557324007548413, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0026141133736043063 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.5008190200746241, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0027912701451645113 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.4579176439966838, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0019838649103218315 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.21649241809836905, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0020808047468387015 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.23946332773224333, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0022622492821207474 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.21699681614941907, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0018260134934355917 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.31896738977233224, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.002249879972490852 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3516931047967278, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0024669281840779384 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.3204737144833669, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0018416039122686005 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.3790705627204969, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0024962460456464603 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.4171792042608784, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0027157128707540365 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.38110492282903374, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0020518013347156708 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed2/evaluation/generation/slim.4b284b84bc4seed2_gem_xsum_article_DOC_summary_0.json b/4b284b84bc4seed2/evaluation/generation/slim.4b284b84bc4seed2_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..83d5ee391d233ee57515b0bba9d4a42718d40221 --- /dev/null +++ b/4b284b84bc4seed2/evaluation/generation/slim.4b284b84bc4seed2_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.17320559498489507, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0025525024097035748 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.33568511811329627, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004457272030335943 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.2173222672616331, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0026735963951633086 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.03984347722138949, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0014498730660041778 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.08293611853648174, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0027922604769135967 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.05119317937818865, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0016915277669349944 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.1306308027797899, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.001979750535716133 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.25481924486600754, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0034477504419509046 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.16413944160730887, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0020492207241516436 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.13618964667417757, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0020883754136888665 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.2671983620973551, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0038518682770408703 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.17170031392993537, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.002265881556419863 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 2.2151365071026334, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.10551243625041298 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed2/evaluation/generation/slim.4b284b84bc4seed2_gem_xsum_article_DOC_summary_1.json b/4b284b84bc4seed2/evaluation/generation/slim.4b284b84bc4seed2_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..be8fe1d4bdb81dcbb983242a84307e2076ea2466 --- /dev/null +++ b/4b284b84bc4seed2/evaluation/generation/slim.4b284b84bc4seed2_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.13193321373947423, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0018249214408045705 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.32491663088067385, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004280533648795701 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.18543200867192464, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0024553301715842025 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.02885078338766851, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0010494871344340587 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.07423283049608298, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0027810291758957346 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.04099230088578755, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0014846354986486204 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.10387006177524372, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0013802990359211345 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.2578619666146113, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.003428735324171146 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.14626844109613504, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0018773361178004498 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.10445447840702451, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.001509990224349501 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.2598290086664842, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0037495698358454184 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.1472004999527075, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0020688083081768726 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.5874448429909755, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.07657449929611179 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed2/evaluation/generation/slim.4b284b84bc4seed2_gem_xsum_article_DOC_summary_2.json b/4b284b84bc4seed2/evaluation/generation/slim.4b284b84bc4seed2_gem_xsum_article_DOC_summary_2.json new file mode 100644 index 0000000000000000000000000000000000000000..963a60078bfa379dbc2635170f592f3cbed24693 --- /dev/null +++ b/4b284b84bc4seed2/evaluation/generation/slim.4b284b84bc4seed2_gem_xsum_article_DOC_summary_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.13378369552141486, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.001828879330748606 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.32737811206091777, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004306408194620798 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.18753394533546663, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0024632687591213827 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.0299925935097244, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0010381433997656876 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.07593086345843493, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0027442526221015794 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.04246731521010523, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0014710047875479853 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.10643964494355733, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0013938532111114862 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.26198866539949395, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0034185812335638674 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.14937612301640457, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0018862901936057773 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.10465900735165316, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0014985247658685268 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.25870432987334707, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0037543234582558148 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.14706588908674015, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0020537944843788485 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.620400084032387, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.1036187597036037 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed2/evaluation/generation/slim.4b284b84bc4seed2_gem_xsum_article_DOC_summary_3.json b/4b284b84bc4seed2/evaluation/generation/slim.4b284b84bc4seed2_gem_xsum_article_DOC_summary_3.json new file mode 100644 index 0000000000000000000000000000000000000000..d810a5fcf303966e8a1b03ce5eccf750c629dac4 --- /dev/null +++ b/4b284b84bc4seed2/evaluation/generation/slim.4b284b84bc4seed2_gem_xsum_article_DOC_summary_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.1325857147512653, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.002104582538451698 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.310270163693354, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004622235270535744 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.181742673631377, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0026996346996907114 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.030071518934551324, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0010760225740262315 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.07399993568063115, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0027512935104685335 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.041996639319967895, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0014924431333982891 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.10572519383258887, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.001594887821630211 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.24999311515441475, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0037295235353239403 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.1455139114170652, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.002103135242813012 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.10501603221104056, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0017119294258030526 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.24836824871710267, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.003968401031348439 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.1443734491656482, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.002242271836640455 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.6556986327135799, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.09408085446538644 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed2/evaluation/generation/slim.4b284b84bc4seed2_gem_xsum_article_DOC_summary_4.json b/4b284b84bc4seed2/evaluation/generation/slim.4b284b84bc4seed2_gem_xsum_article_DOC_summary_4.json new file mode 100644 index 0000000000000000000000000000000000000000..b93999343b403faa254fe1e679ded077ca6e330d --- /dev/null +++ b/4b284b84bc4seed2/evaluation/generation/slim.4b284b84bc4seed2_gem_xsum_article_DOC_summary_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.04185793101612411, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0025354871639657332 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.07960189442566881, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004594099676529609 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.051203664083526064, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.002916215578123627 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.009545271254314988, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0009027168872299666 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.019489192736000506, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0016525733661952122 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.012145091480254444, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.001038605071999789 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.03331696824804232, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.002048247078605598 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.06320111546579645, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0036120398264049094 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.040479741202891835, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0022777830898179745 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.033884182850020796, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0021113829994884406 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.0637408678817515, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.003715585442877857 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.041001723419299384, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0023481586557545764 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 0.8787323538547989, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.09806037997681721 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed2/evaluation/generation/slim.4b284b84bc4seed2_gem_xsum_article_DOC_summary_5.json b/4b284b84bc4seed2/evaluation/generation/slim.4b284b84bc4seed2_gem_xsum_article_DOC_summary_5.json new file mode 100644 index 0000000000000000000000000000000000000000..e526efbe13dd13df0e55182ee37ceaf6699fe879 --- /dev/null +++ b/4b284b84bc4seed2/evaluation/generation/slim.4b284b84bc4seed2_gem_xsum_article_DOC_summary_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.003661405957465891, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0010410174134967514 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.003073378808572809, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.0008998604189966408 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.003279934928320664, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0009428534366320934 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.0007725002522449804, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0003775496435431225 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.0007322912012146197, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0003972475356359937 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.0007405035248494208, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.00038311030521319677 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.002439909640242604, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0006917842321148266 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.0020657262287064482, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.000601437175466453 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.0021896510504014074, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0006251341441438973 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.0030026261505173824, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0008643214712623419 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.002523952641616138, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0007458033281437961 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.0026863003460885, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0007784026207598828 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 6.480764426251045e-36, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 1.6529080147588964e-30 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed2/evaluation/rankeval/4b284b84bc4seed2_0.csv b/4b284b84bc4seed2/evaluation/rankeval/4b284b84bc4seed2_0.csv new file mode 100644 index 0000000000000000000000000000000000000000..f6afb690bf1b5c24059cdc0016dbb43cc36ca9ec --- /dev/null +++ b/4b284b84bc4seed2/evaluation/rankeval/4b284b84bc4seed2_0.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.332,0.014899597242811482,0 +anli_r2,acc,0.34,0.014987482264363937,0 +anli_r3,acc,0.3375,0.013655897185463658,0 +arc_challenge,acc,0.2764505119453925,0.013069662474252425,0 +arc_challenge,acc_norm,0.29266211604095566,0.01329591610361942,0 +arc_easy,acc,0.6165824915824916,0.009976995068264716,0 +arc_easy,acc_norm,0.5395622895622896,0.010227616386289017,0 +boolq,acc,0.5960244648318043,0.008582268854021406,1 +cb,acc,0.4107142857142857,0.0663363415035954,1 +cb,f1,0.1940928270042194,,1 +copa,acc,0.77,0.04229525846816506,0 +hellaswag,acc,0.48157737502489545,0.004986393266269168,0 +hellaswag,acc_norm,0.629555865365465,0.004819367172685975,0 +piqa,acc,0.7551686615886833,0.010032309105568795,0 +piqa,acc_norm,0.7693144722524483,0.009828959550983096,0 +rte,acc,0.5342960288808665,0.030025579819366426,0 +sciq,acc,0.852,0.011234866364235237,0 +sciq,acc_norm,0.768,0.013354937452281567,0 +storycloze_2016,acc,0.7194013896312133,0.010389809647288821,0 +winogrande,acc,0.5864246250986582,0.013840971763195304,0 diff --git a/4b284b84bc4seed2/evaluation/rankeval/4b284b84bc4seed2_0.json b/4b284b84bc4seed2/evaluation/rankeval/4b284b84bc4seed2_0.json new file mode 100644 index 0000000000000000000000000000000000000000..79cf2fb9589ccf103f06cff4bd7e26a05eb6b446 --- /dev/null +++ b/4b284b84bc4seed2/evaluation/rankeval/4b284b84bc4seed2_0.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.332, + "acc_stderr": 0.014899597242811482 + }, + "anli_r2": { + "acc": 0.34, + "acc_stderr": 0.014987482264363937 + }, + "anli_r3": { + "acc": 0.3375, + "acc_stderr": 0.013655897185463658 + }, + "cb": { + "acc": 0.4107142857142857, + "acc_stderr": 0.0663363415035954, + "f1": 0.1940928270042194 + }, + "copa": { + "acc": 0.77, + "acc_stderr": 0.04229525846816506 + }, + "hellaswag": { + "acc": 0.48157737502489545, + "acc_stderr": 0.004986393266269168, + "acc_norm": 0.629555865365465, + "acc_norm_stderr": 0.004819367172685975 + }, + "rte": { + "acc": 0.5342960288808665, + "acc_stderr": 0.030025579819366426 + }, + "winogrande": { + "acc": 0.5864246250986582, + "acc_stderr": 0.013840971763195304 + }, + "storycloze_2016": { + "acc": 0.7194013896312133, + "acc_stderr": 0.010389809647288821 + }, + "boolq": { + "acc": 0.5960244648318043, + "acc_stderr": 0.008582268854021406 + }, + "arc_easy": { + "acc": 0.6165824915824916, + "acc_stderr": 0.009976995068264716, + "acc_norm": 0.5395622895622896, + "acc_norm_stderr": 0.010227616386289017 + }, + "arc_challenge": { + "acc": 0.2764505119453925, + "acc_stderr": 0.013069662474252425, + "acc_norm": 0.29266211604095566, + "acc_norm_stderr": 0.01329591610361942 + }, + "sciq": { + "acc": 0.852, + "acc_stderr": 0.011234866364235237, + "acc_norm": 0.768, + "acc_norm_stderr": 0.013354937452281567 + }, + "piqa": { + "acc": 0.7551686615886833, + "acc_stderr": 0.010032309105568795, + "acc_norm": 0.7693144722524483, + "acc_norm_stderr": 0.009828959550983096 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed2/evaluation/rankeval/4b284b84bc4seed2_1.csv b/4b284b84bc4seed2/evaluation/rankeval/4b284b84bc4seed2_1.csv new file mode 100644 index 0000000000000000000000000000000000000000..31f02c9ae67ce29b96b551ae10a29742d206049e --- /dev/null +++ b/4b284b84bc4seed2/evaluation/rankeval/4b284b84bc4seed2_1.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.342,0.015008706182121731,0 +anli_r2,acc,0.333,0.01491084616422987,0 +anli_r3,acc,0.3425,0.013704669762934723,0 +arc_challenge,acc,0.28071672354948807,0.013131238126975574,0 +arc_challenge,acc_norm,0.31569965870307165,0.013582571095815291,0 +arc_easy,acc,0.6296296296296297,0.009908978578665757,0 +arc_easy,acc_norm,0.5955387205387206,0.01007074664827879,0 +boolq,acc,0.6180428134556575,0.008497851998427189,1 +cb,acc,0.39285714285714285,0.0658538889806635,1 +cb,f1,0.19555555555555557,,1 +copa,acc,0.74,0.0440844002276808,0 +hellaswag,acc,0.477096195976897,0.004984543540932341,0 +hellaswag,acc_norm,0.6266679944234216,0.004827006520802888,0 +piqa,acc,0.7519042437431991,0.010077118315574717,0 +piqa,acc_norm,0.7627856365614799,0.00992469493358637,0 +rte,acc,0.5523465703971119,0.02993107036293953,0 +sciq,acc,0.908,0.009144376393151113,0 +sciq,acc_norm,0.89,0.009899393819724444,0 +storycloze_2016,acc,0.7108498129342598,0.010484068799942072,0 +winogrande,acc,0.5911602209944752,0.01381695429513569,0 diff --git a/4b284b84bc4seed2/evaluation/rankeval/4b284b84bc4seed2_1.json b/4b284b84bc4seed2/evaluation/rankeval/4b284b84bc4seed2_1.json new file mode 100644 index 0000000000000000000000000000000000000000..272618276751cd954d034e8356e3c85ce3da0bca --- /dev/null +++ b/4b284b84bc4seed2/evaluation/rankeval/4b284b84bc4seed2_1.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.342, + "acc_stderr": 0.015008706182121731 + }, + "anli_r2": { + "acc": 0.333, + "acc_stderr": 0.01491084616422987 + }, + "anli_r3": { + "acc": 0.3425, + "acc_stderr": 0.013704669762934723 + }, + "cb": { + "acc": 0.39285714285714285, + "acc_stderr": 0.0658538889806635, + "f1": 0.19555555555555557 + }, + "copa": { + "acc": 0.74, + "acc_stderr": 0.0440844002276808 + }, + "hellaswag": { + "acc": 0.477096195976897, + "acc_stderr": 0.004984543540932341, + "acc_norm": 0.6266679944234216, + "acc_norm_stderr": 0.004827006520802888 + }, + "rte": { + "acc": 0.5523465703971119, + "acc_stderr": 0.02993107036293953 + }, + "winogrande": { + "acc": 0.5911602209944752, + "acc_stderr": 0.01381695429513569 + }, + "storycloze_2016": { + "acc": 0.7108498129342598, + "acc_stderr": 0.010484068799942072 + }, + "boolq": { + "acc": 0.6180428134556575, + "acc_stderr": 0.008497851998427189 + }, + "arc_easy": { + "acc": 0.6296296296296297, + "acc_stderr": 0.009908978578665757, + "acc_norm": 0.5955387205387206, + "acc_norm_stderr": 0.01007074664827879 + }, + "arc_challenge": { + "acc": 0.28071672354948807, + "acc_stderr": 0.013131238126975574, + "acc_norm": 0.31569965870307165, + "acc_norm_stderr": 0.013582571095815291 + }, + "sciq": { + "acc": 0.908, + "acc_stderr": 0.009144376393151113, + "acc_norm": 0.89, + "acc_norm_stderr": 0.009899393819724444 + }, + "piqa": { + "acc": 0.7519042437431991, + "acc_stderr": 0.010077118315574717, + "acc_norm": 0.7627856365614799, + "acc_norm_stderr": 0.00992469493358637 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed2/evaluation/rankeval/4b284b84bc4seed2_2.csv b/4b284b84bc4seed2/evaluation/rankeval/4b284b84bc4seed2_2.csv new file mode 100644 index 0000000000000000000000000000000000000000..160eee85a6bb21d5d93ebaa24d9aae55ee113cfb --- /dev/null +++ b/4b284b84bc4seed2/evaluation/rankeval/4b284b84bc4seed2_2.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.34,0.014987482264363935,0 +anli_r2,acc,0.323,0.014794927843348633,0 +anli_r3,acc,0.33416666666666667,0.01362243481313678,0 +arc_challenge,acc,0.2960750853242321,0.01334091608524626,0 +arc_challenge,acc_norm,0.3165529010238908,0.013592431519068079,0 +arc_easy,acc,0.6346801346801347,0.009880576614806924,0 +arc_easy,acc_norm,0.6047979797979798,0.010031894052790978,0 +boolq,acc,0.634862385321101,0.008420941009417812,1 +cb,acc,0.4107142857142857,0.0663363415035954,1 +cb,f1,0.21597096188747733,,1 +copa,acc,0.78,0.04163331998932261,0 +hellaswag,acc,0.47470623381796456,0.004983392650570956,0 +hellaswag,acc_norm,0.6288587930691097,0.0048212280346248615,0 +piqa,acc,0.7475516866158868,0.010135665547362364,0 +piqa,acc_norm,0.7633297062023939,0.009916841655042809,0 +rte,acc,0.51985559566787,0.030072723167317177,0 +sciq,acc,0.917,0.008728527206074792,0 +sciq,acc_norm,0.904,0.00932045443478322,0 +storycloze_2016,acc,0.7215392838054516,0.010365521460604429,0 +winogrande,acc,0.5943172849250198,0.01380020633601421,0 diff --git a/4b284b84bc4seed2/evaluation/rankeval/4b284b84bc4seed2_2.json b/4b284b84bc4seed2/evaluation/rankeval/4b284b84bc4seed2_2.json new file mode 100644 index 0000000000000000000000000000000000000000..97cc7267089f6055cf0dd4775d3c79eeba44b4ae --- /dev/null +++ b/4b284b84bc4seed2/evaluation/rankeval/4b284b84bc4seed2_2.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.34, + "acc_stderr": 0.014987482264363935 + }, + "anli_r2": { + "acc": 0.323, + "acc_stderr": 0.014794927843348633 + }, + "anli_r3": { + "acc": 0.33416666666666667, + "acc_stderr": 0.01362243481313678 + }, + "cb": { + "acc": 0.4107142857142857, + "acc_stderr": 0.0663363415035954, + "f1": 0.21597096188747733 + }, + "copa": { + "acc": 0.78, + "acc_stderr": 0.04163331998932261 + }, + "hellaswag": { + "acc": 0.47470623381796456, + "acc_stderr": 0.004983392650570956, + "acc_norm": 0.6288587930691097, + "acc_norm_stderr": 0.0048212280346248615 + }, + "rte": { + "acc": 0.51985559566787, + "acc_stderr": 0.030072723167317177 + }, + "winogrande": { + "acc": 0.5943172849250198, + "acc_stderr": 0.01380020633601421 + }, + "storycloze_2016": { + "acc": 0.7215392838054516, + "acc_stderr": 0.010365521460604429 + }, + "boolq": { + "acc": 0.634862385321101, + "acc_stderr": 0.008420941009417812 + }, + "arc_easy": { + "acc": 0.6346801346801347, + "acc_stderr": 0.009880576614806924, + "acc_norm": 0.6047979797979798, + "acc_norm_stderr": 0.010031894052790978 + }, + "arc_challenge": { + "acc": 0.2960750853242321, + "acc_stderr": 0.01334091608524626, + "acc_norm": 0.3165529010238908, + "acc_norm_stderr": 0.013592431519068079 + }, + "sciq": { + "acc": 0.917, + "acc_stderr": 0.008728527206074792, + "acc_norm": 0.904, + "acc_norm_stderr": 0.00932045443478322 + }, + "piqa": { + "acc": 0.7475516866158868, + "acc_stderr": 0.010135665547362364, + "acc_norm": 0.7633297062023939, + "acc_norm_stderr": 0.009916841655042809 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed2/evaluation/rankeval/4b284b84bc4seed2_3.csv b/4b284b84bc4seed2/evaluation/rankeval/4b284b84bc4seed2_3.csv new file mode 100644 index 0000000000000000000000000000000000000000..3f0d5cee77e63cb490a6e3e1dab083be39834fdf --- /dev/null +++ b/4b284b84bc4seed2/evaluation/rankeval/4b284b84bc4seed2_3.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.337,0.014955087918653602,0 +anli_r2,acc,0.335,0.014933117490932579,0 +anli_r3,acc,0.34833333333333333,0.013759437498874082,0 +arc_challenge,acc,0.28754266211604096,0.013226719056266129,0 +arc_challenge,acc_norm,0.2986348122866894,0.013374078615068752,0 +arc_easy,acc,0.6317340067340067,0.009897286209010894,0 +arc_easy,acc_norm,0.6220538720538721,0.009949405744045481,0 +boolq,acc,0.6235474006116208,0.008473882279194591,1 +cb,acc,0.4107142857142857,0.0663363415035954,1 +cb,f1,0.2780390107976315,,1 +copa,acc,0.79,0.040936018074033256,0 +hellaswag,acc,0.4759012148974308,0.004983982396187369,0 +hellaswag,acc_norm,0.6304521011750648,0.004816958817726088,0 +piqa,acc,0.7546245919477693,0.010039831320422401,0 +piqa,acc_norm,0.7595212187159956,0.009971345364651068,0 +rte,acc,0.5523465703971119,0.02993107036293953,0 +sciq,acc,0.911,0.00900889339265153,0 +sciq,acc_norm,0.903,0.00936368937324812,0 +storycloze_2016,acc,0.7311598075895244,0.010252563090396087,0 +winogrande,acc,0.5777426992896606,0.013881582030658545,0 diff --git a/4b284b84bc4seed2/evaluation/rankeval/4b284b84bc4seed2_3.json b/4b284b84bc4seed2/evaluation/rankeval/4b284b84bc4seed2_3.json new file mode 100644 index 0000000000000000000000000000000000000000..1c5b8b5e5cc265cb61905d23ed2315715d2f4a98 --- /dev/null +++ b/4b284b84bc4seed2/evaluation/rankeval/4b284b84bc4seed2_3.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.337, + "acc_stderr": 0.014955087918653602 + }, + "anli_r2": { + "acc": 0.335, + "acc_stderr": 0.014933117490932579 + }, + "anli_r3": { + "acc": 0.34833333333333333, + "acc_stderr": 0.013759437498874082 + }, + "cb": { + "acc": 0.4107142857142857, + "acc_stderr": 0.0663363415035954, + "f1": 0.2780390107976315 + }, + "copa": { + "acc": 0.79, + "acc_stderr": 0.040936018074033256 + }, + "hellaswag": { + "acc": 0.4759012148974308, + "acc_stderr": 0.004983982396187369, + "acc_norm": 0.6304521011750648, + "acc_norm_stderr": 0.004816958817726088 + }, + "rte": { + "acc": 0.5523465703971119, + "acc_stderr": 0.02993107036293953 + }, + "winogrande": { + "acc": 0.5777426992896606, + "acc_stderr": 0.013881582030658545 + }, + "storycloze_2016": { + "acc": 0.7311598075895244, + "acc_stderr": 0.010252563090396087 + }, + "boolq": { + "acc": 0.6235474006116208, + "acc_stderr": 0.008473882279194591 + }, + "arc_easy": { + "acc": 0.6317340067340067, + "acc_stderr": 0.009897286209010894, + "acc_norm": 0.6220538720538721, + "acc_norm_stderr": 0.009949405744045481 + }, + "arc_challenge": { + "acc": 0.28754266211604096, + "acc_stderr": 0.013226719056266129, + "acc_norm": 0.2986348122866894, + "acc_norm_stderr": 0.013374078615068752 + }, + "sciq": { + "acc": 0.911, + "acc_stderr": 0.00900889339265153, + "acc_norm": 0.903, + "acc_norm_stderr": 0.00936368937324812 + }, + "piqa": { + "acc": 0.7546245919477693, + "acc_stderr": 0.010039831320422401, + "acc_norm": 0.7595212187159956, + "acc_norm_stderr": 0.009971345364651068 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed2/evaluation/rankeval/4b284b84bc4seed2_4.csv b/4b284b84bc4seed2/evaluation/rankeval/4b284b84bc4seed2_4.csv new file mode 100644 index 0000000000000000000000000000000000000000..8560d40479446525e5470eae998e18949e1f5fb9 --- /dev/null +++ b/4b284b84bc4seed2/evaluation/rankeval/4b284b84bc4seed2_4.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.358,0.015167928865407557,0 +anli_r2,acc,0.317,0.014721675438880233,0 +anli_r3,acc,0.33,0.013579531277800925,0 +arc_challenge,acc,0.2858361774744027,0.01320319608853737,0 +arc_challenge,acc_norm,0.3122866894197952,0.013542598541688067,0 +arc_easy,acc,0.6308922558922558,0.009901987410242735,0 +arc_easy,acc_norm,0.6178451178451179,0.00997074728129242,0 +boolq,acc,0.6259938837920489,0.008462855721594175,1 +cb,acc,0.4107142857142857,0.0663363415035954,1 +cb,f1,0.19658119658119655,,1 +copa,acc,0.78,0.04163331998932261,0 +hellaswag,acc,0.4750049790878311,0.004983542768853551,0 +hellaswag,acc_norm,0.6311491734714201,0.004815073334000603,0 +piqa,acc,0.749727965179543,0.010106561880089782,0 +piqa,acc_norm,0.7573449401523396,0.01000200256970869,0 +rte,acc,0.5415162454873647,0.029992535385373314,0 +sciq,acc,0.921,0.008534156773333435,0 +sciq,acc_norm,0.916,0.008776162089491137,0 +storycloze_2016,acc,0.7332977017637627,0.010226634575145221,0 +winogrande,acc,0.601420678768745,0.01376035717687383,0 diff --git a/4b284b84bc4seed2/evaluation/rankeval/4b284b84bc4seed2_4.json b/4b284b84bc4seed2/evaluation/rankeval/4b284b84bc4seed2_4.json new file mode 100644 index 0000000000000000000000000000000000000000..498d23e9f38e3c76712a5b5fc02ee9d4a55512ae --- /dev/null +++ b/4b284b84bc4seed2/evaluation/rankeval/4b284b84bc4seed2_4.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.358, + "acc_stderr": 0.015167928865407557 + }, + "anli_r2": { + "acc": 0.317, + "acc_stderr": 0.014721675438880233 + }, + "anli_r3": { + "acc": 0.33, + "acc_stderr": 0.013579531277800925 + }, + "cb": { + "acc": 0.4107142857142857, + "acc_stderr": 0.0663363415035954, + "f1": 0.19658119658119655 + }, + "copa": { + "acc": 0.78, + "acc_stderr": 0.04163331998932261 + }, + "hellaswag": { + "acc": 0.4750049790878311, + "acc_stderr": 0.004983542768853551, + "acc_norm": 0.6311491734714201, + "acc_norm_stderr": 0.004815073334000603 + }, + "rte": { + "acc": 0.5415162454873647, + "acc_stderr": 0.029992535385373314 + }, + "winogrande": { + "acc": 0.601420678768745, + "acc_stderr": 0.01376035717687383 + }, + "storycloze_2016": { + "acc": 0.7332977017637627, + "acc_stderr": 0.010226634575145221 + }, + "boolq": { + "acc": 0.6259938837920489, + "acc_stderr": 0.008462855721594175 + }, + "arc_easy": { + "acc": 0.6308922558922558, + "acc_stderr": 0.009901987410242735, + "acc_norm": 0.6178451178451179, + "acc_norm_stderr": 0.00997074728129242 + }, + "arc_challenge": { + "acc": 0.2858361774744027, + "acc_stderr": 0.01320319608853737, + "acc_norm": 0.3122866894197952, + "acc_norm_stderr": 0.013542598541688067 + }, + "sciq": { + "acc": 0.921, + "acc_stderr": 0.008534156773333435, + "acc_norm": 0.916, + "acc_norm_stderr": 0.008776162089491137 + }, + "piqa": { + "acc": 0.749727965179543, + "acc_stderr": 0.010106561880089782, + "acc_norm": 0.7573449401523396, + "acc_norm_stderr": 0.01000200256970869 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed2/evaluation/rankeval/4b284b84bc4seed2_5.csv b/4b284b84bc4seed2/evaluation/rankeval/4b284b84bc4seed2_5.csv new file mode 100644 index 0000000000000000000000000000000000000000..94273be08fe4b681d480ab5a3551f42a4956fe9f --- /dev/null +++ b/4b284b84bc4seed2/evaluation/rankeval/4b284b84bc4seed2_5.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.329,0.014865395385928359,0 +anli_r2,acc,0.314,0.014683991951087967,0 +anli_r3,acc,0.3283333333333333,0.01356203291952902,0 +arc_challenge,acc,0.295221843003413,0.01332975029338232,0 +arc_challenge,acc_norm,0.31399317406143346,0.013562691224726286,0 +arc_easy,acc,0.6426767676767676,0.009833205612463116,0 +arc_easy,acc_norm,0.622895622895623,0.009945041946366527,0 +boolq,acc,0.6247706422018349,0.008468397820914275,1 +cb,acc,0.39285714285714285,0.0658538889806635,1 +cb,f1,0.18803418803418803,,1 +copa,acc,0.77,0.04229525846816506,0 +hellaswag,acc,0.47649870543716394,0.004984266543053124,0 +hellaswag,acc_norm,0.6382194781915953,0.004795337009118188,0 +piqa,acc,0.7519042437431991,0.010077118315574719,0 +piqa,acc_norm,0.7600652883569097,0.009963625892809545,0 +rte,acc,0.51985559566787,0.030072723167317184,0 +sciq,acc,0.92,0.008583336977753655,0 +sciq,acc_norm,0.916,0.008776162089491132,0 +storycloze_2016,acc,0.7247461250668092,0.01032853840050057,0 +winogrande,acc,0.6053670086819258,0.013736915172371883,0 diff --git a/4b284b84bc4seed2/evaluation/rankeval/4b284b84bc4seed2_5.json b/4b284b84bc4seed2/evaluation/rankeval/4b284b84bc4seed2_5.json new file mode 100644 index 0000000000000000000000000000000000000000..187ca7a0438fb9dcb659901552dba88b654bce23 --- /dev/null +++ b/4b284b84bc4seed2/evaluation/rankeval/4b284b84bc4seed2_5.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.329, + "acc_stderr": 0.014865395385928359 + }, + "anli_r2": { + "acc": 0.314, + "acc_stderr": 0.014683991951087967 + }, + "anli_r3": { + "acc": 0.3283333333333333, + "acc_stderr": 0.01356203291952902 + }, + "cb": { + "acc": 0.39285714285714285, + "acc_stderr": 0.0658538889806635, + "f1": 0.18803418803418803 + }, + "copa": { + "acc": 0.77, + "acc_stderr": 0.04229525846816506 + }, + "hellaswag": { + "acc": 0.47649870543716394, + "acc_stderr": 0.004984266543053124, + "acc_norm": 0.6382194781915953, + "acc_norm_stderr": 0.004795337009118188 + }, + "rte": { + "acc": 0.51985559566787, + "acc_stderr": 0.030072723167317184 + }, + "winogrande": { + "acc": 0.6053670086819258, + "acc_stderr": 0.013736915172371883 + }, + "storycloze_2016": { + "acc": 0.7247461250668092, + "acc_stderr": 0.01032853840050057 + }, + "boolq": { + "acc": 0.6247706422018349, + "acc_stderr": 0.008468397820914275 + }, + "arc_easy": { + "acc": 0.6426767676767676, + "acc_stderr": 0.009833205612463116, + "acc_norm": 0.622895622895623, + "acc_norm_stderr": 0.009945041946366527 + }, + "arc_challenge": { + "acc": 0.295221843003413, + "acc_stderr": 0.01332975029338232, + "acc_norm": 0.31399317406143346, + "acc_norm_stderr": 0.013562691224726286 + }, + "sciq": { + "acc": 0.92, + "acc_stderr": 0.008583336977753655, + "acc_norm": 0.916, + "acc_norm_stderr": 0.008776162089491132 + }, + "piqa": { + "acc": 0.7519042437431991, + "acc_stderr": 0.010077118315574719, + "acc_norm": 0.7600652883569097, + "acc_norm_stderr": 0.009963625892809545 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..166b707be61c576d52abcebb469c9ccc10f36f35 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ee7dc858b8c843f53dc959ce40dae61461d83b8173965d6b4d3aa3f933a39a9 +size 199058647 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d9444714487f5923f6a493416b575d1974077587 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48c0a410aba313cc016dca65699b078afe020d6f2973c11b58640df695cd3f9c +size 199058647 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2178de5381be5f166407b10c6b32d987f8a5bf48 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a5576a15f3ee9b9989948d8e2d162098a5717ac1c637bcf6dd42a4f4c9926b1 +size 199058733 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e97941de3ae9ec177a5e5138ab5ad8e3088a8731 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:346310d0c31f26b0e31014b89b9d0dc9d485e5ae77484ab4c89fd62215dda622 +size 199058733 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..797c10c6fe6d1c8efdd7eb3438fa1071f9714539 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41388e692fe489d3ad34c265135cbeb51e418dd80bdd1c75e0b2014f723e8227 +size 199058797 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a892dab0f4d7874a18d2731a41f405b8eb893704 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2d70ee3ce0a7ab3650d5c9b02b5ffde07db7fef5f101ad22098984dad261b5e +size 199058797 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a5c8a048288d06ebc2a5e9ca0bee0d78c437271 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67d6df02b7603a646bb0b5c5b4295adba124467e3de4998390dd22150c15109f +size 199058733 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5f92f571ff7402b80fc62a618e6ccc7b0d7c0c3d --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7df461c11fc4770ff9ff70c9f144344d649c9426eaa9b46e83d36de4a6d7ff98 +size 199058733 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f02733fe5df833e28baac551f91be0ddecfd145 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f06f74d0b7f04436af338d2db8a7b65a64afaae53a612767dd0fae75feb46c19 +size 199058733 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..78930eeb3941dd49e39733f7bea5034ce2d15d88 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aedf627063250b128c09921e67647ea298bb882e7a0efc3d0c98de2ba3dc83cc +size 199058733 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..03f736814913dcfdda353505215d2e014c42358f --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5162ce78e86cf573191444093374e07cf3ac48afeab1d596d8b19fca7919ebbb +size 199058797 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6504d6d1b2fd8528e5738a227a8ed3df40bf6484 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0dfbacb3c0e9aa106f39ae15c030661a2c5b3b16b0b6e3b46aab88ec7baeee4 +size 199058797 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab3bb2f7b3393a3eebf6798ca08296709f30be21 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f84df2a04175ee4c6eea85885d0da5a97c60e2fd428db7e180c12be6aa4d338c +size 199058733 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..87cc535cf50bc3f01c4daabea6e2aad82a528b7c --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:256f85730d4cbc88ce498d76f276d01c9efd7e86605f95a718fa1d8c1f55bc1c +size 199058733 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7da5db9327feb8c40ac55723d4983d9b98b3b1a0 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0fd39a946bbcef26ef120acca470d6c3b994db1ad1b7efe135ec4fc7e40b57b6 +size 199058669 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb3bfe28c4a61e2161ded2ff3d2c1774239a34cf --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0dd3a47e945203605d6b32107913338a9d9e5ddce115d335efc03ae9c86aa106 +size 199058669 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f39cc9b6e0017e4a79fcd72f25c2a5b5c0efb99 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0cf9217cbea2bc2a6e8b722c5dbd7fda479d458986af7f405ae105dbdd9e610 +size 199058797 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e8dcb8d739f95a2378f15f06e04c0766f014f39 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f40de08e80c0a3238f5b7c3b4304f10c1b690d4aaf1fe8bf5fc03cd9b92d2531 +size 199058797 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a0a7378a4303e01e4a9766edc3162462d1c55ed2 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74b41070a413ba4de2a505872e4a32b3d82aa97d001b222612f1b0f3fba7dcd0 +size 199058733 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..750ab0748b87746fe5a7de07aa2ace8b17de3e81 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7999d41892292154d64550cb4a48fe664aa4921df050e53df09c8807abba06b8 +size 199058733 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b8bde3611d48331eacb37c62bc8b9d6092bcddc --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac422ea0db6f714e5865aee8021e8224e0689f2b36576f0cc6910fa135be8935 +size 199058733 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9bfd39914e5931c0706526c3e604bc2e88ee5f06 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fedd23677566bfb69ee613fae46fdb0e4d8497f99e8dd8a66fa8ec251998ba1e +size 199058733 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c1cdf1b7ceb056f9e35331bccd47a3302677fb0 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46221632ef48121b3e75b4bc6b828a55098fed7b36dd6087fd0a8530ebe7ddbc +size 199058658 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2686332efa59fef486e6528c3375770279fbed68 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06bc0aacdafc9162b74dd8e885dd77e5629a1bfef10a852fd10a33775b8ef273 +size 199058658 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4dd1cd865bbb2f3037720c8e4adcb76179699555 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e5904cf9694e89ef8355a6817d67df542b9603e5fca30c2708a12403881f466 +size 199058733 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e14f37b47195d099373b99b913b52b5ea75a76e3 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1aa6e26e8de7d949abeadb19d00a17972e84f44b88f7329ec7c925af2b6ffc3 +size 199058733 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..66068974703fc80d5fa50f26bfa94c90959c22e8 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47296a761efe14f543f22de63a17c319ec581e18dd527ab8168d248e38352c5a +size 199058797 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..80e9c71b40b9af44ff901d6da7926904948eaed3 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9259bc0ca9769b1b2c214d179a3e257f1de3ec795b741f08760781ab7a66f4b3 +size 199058797 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..972a9fa01c7c0e369363a9e1bc5d1551d919be63 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd046772bf2072a28bbe1d1f4c0d77d5113963154eab2f7537ea65c9fb8ae9be +size 199058605 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..adc2179ad9b312295e12794771f0588bdc6ccaeb --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c331540ca2dbc5e76a6e2d4cc6fdf53d861ac185dccff3d954856af922371b75 +size 199058605 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ecaa39916bbe474e220e2f057871c975dadca1f9 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3630ecc579a637d5d4abae0fd134a685e1de315bd833df8adaf58254c71d499e +size 199058669 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c97b29b935ee2f282a600adc046cf97fbfc41171 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be576795382b43ec9e57a4f61de3f1475a2114c58747c3f13c4887a77b6a8780 +size 199058669 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e6883f0480c9469f6da286cea1712399c5c937d0 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd2342c9fcba09b8da2f0b97dd9381029561874d261f9a7fda420f2188e8fb10 +size 199058797 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b98f46413c24ccad4935f58e771ab6c8bfeb5bb2 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7289350f81b1907e4c77fd950f96f8b1e2afc3317792d949bafe5ee3b749a23a +size 199058797 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..32e533b776315002201d901120ae74022c94f609 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05d3a9b1883076d11e6479b1c33f118ef84405fe27be2501acc37dd3fefd3d7a +size 199058733 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e324cda0f434b0e8cfadcac02c847756f69d18e --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:688d4f78b9b1db92001fe73098eb3d640c51ad4d1e8740f9795719d91200c2be +size 199058733 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..30c45bb4e41c86f95231d1aa9ec71a7a76c576b4 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4245c8e59679f90213bd50051034f7a3fb3b39717b7ce88a6d676ea8197f843 +size 199058733 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad89fb421b9e1a96263a5344f8963bde680aa8ec --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62d15628eff61e3b63073220bad4f2e55777920bd65901ac7b8aef1fe30db439 +size 199058733 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8671f681b6ccc2fde36b4e15495b24373b69b511 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b05d732a665d1c1fed059a26db5c913322572173a225288aa8c09c17b3f3082 +size 199058733 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b46ca5cb93b15d6acb4b413aa6e369c14b991aa1 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a61d1c528e00bf74684c3752217b1757594ce4b8db61c3ac83fe3d7408b76489 +size 199058733 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..19fc12358fe756ca6d379f0d4c3c67fea669fdcd --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5acc2a4455c15f5f19bdd3b3eb18fcbd8a6faccd2ad82970ed2e84f39fc4a25 +size 199058797 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc6927a4c948cfcaa4ae608e329adfd29ec62d06 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a8134f0d1e7d4a1158c704aff4ee55be74341ef2b6ef3a835d47ca669dae2ac +size 199058797 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..08fc97ba00b1c075139f9387a7ea33471a91ab55 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5699906a286c85797b8a541539b1a6a49b370192bd2ccd11138e23ce47003fcf +size 199058669 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b0f7d35752305576128d5cc4a8e0afee76710f7c --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9f8c56b084c171e46084602b14cf4d037b8f00982319bd93b747f0866a49560 +size 199058669 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0085a5fa3ec76f5d96e3667fbbd7143bb92cf076 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16a4151eb46cdf7c9163257af2584590c3b6203c4ad657f935ae4dbfdcaa3de4 +size 199058850 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..50dbe20997f4343caa6eb8b659c9ee6879760caf --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3938fe57b17a1b2b919f7e8b61b4a40bd8699d99c7261ffe730ff6c46a945c1e +size 199058850 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9795d895eb7916d84f2c771b563f3a64b54ea485 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d02f22d4fe9f5cb91a77e86758a43923d00990dc6af71066b9e729104ae22c5f +size 199058669 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1fed146dc63b8f831fc38bf6db9c1d5941911255 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96a614ba7936ffe59e40169a6ef12c7fd5021c3fa0e04e7d0e221656b0d1639f +size 199058669 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..32122c111915a1a475b209faa42a91eaacbf5ca2 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2752d67b3ebe386159cac6cfab160306d26ff5bedd565afc3c46bc71d05d9ac5 +size 199058797 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..13ae92abe89692080d1e0fe51107c8120f2882f4 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fdb0a273339512942bca4bfbe773e55d032651f805164204c37bdd61f0906b3c +size 199058797 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..65569d498e75ae36109d3a74a054d0db54641576 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:366c3b9f34e8c515a1d7f092edb1a68fca3d41142da822092ccec6f594dc6e19 +size 199058733 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..48bf3ac3589f76fd4676be60316e4621f1aa802f --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78a5439bdfb7d918290a4367f09e02e44f7248c39141c7ae6f6bb025c564026b +size 199058733 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8caafea879b0af17731950f55d90ee7f53459e16 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15c6221fad700108e55fe4f364007b6ab3693a853d0627987b06c454e6617f6a +size 199058733 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba6475a2374de43c50dbc15d7057427ffcd98190 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0594018b38cedb87ab4979710ab35e415b362fd2ea8eae1611fadc39554ff5c +size 199058733 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e7bf1747e2aab6163a3c157708603a4b7378a5ae --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff6cef8f388e54bee8f0ca65e1462de49d0de9c719ee3db4e11bc9c93a91e15e +size 199058669 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e411b5515b782564808a872cf5f1e6bf8a93d13 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f64857d1f75541b3b906bd55e740f53518d3e387ef4d9b7b95c278629481268 +size 199058669 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7469f36860ea2bf8227169d4f4e9bfdd1138b797 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55fbe9f53da5b4a18f713f9c26e8c0cd52039b53a70bce0d4ea92a6846cad40e +size 199058925 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..297084171edfce6a25da01a7c1ce86e40fa6fd74 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de0fe362b25d49ce090ce4da8b9804c1ae797523ed37f0b2b016bae45adbe5d5 +size 199058925 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf59ffc469b68bf234831f4946e61e9e7cb98181 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b96ebdb423812434e30b72395b60f6a8d6df1338ad51e35e7f497e7074a37fb7 +size 199058605 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..962577de1d800ec595173cb417f1221dcb196b5b --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55fbced9d4e88cfc528a904de5d1d6e5a4303ff19e88383f2da71978239c3bf8 +size 199058605 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..363f2ae43b0ba35b83090f4a133491ebb434bea3 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:698d794db531e85de20a77ef0c93f8805b0ff66d7b7c069db1d8462e7f14252b +size 199058605 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7a20889914c91835c8eb13027c736ea4171bbc9f --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04fea719a2d12117a99a4fa3b31af6981e2a05983bd820c17663accb2c4d22d7 +size 199058605 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3053c1a10a5ffd255189daa16a3fc6b55a121f8b --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5a7be9e6e1b99343e100d06e065961944fb7a0de85e40d1af9fd4e99765550a +size 199058722 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b2612e426495619ed3cf808ac1361bee402e308 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ddc79d10f05986ab9918d34c5d61c6dbac0ff69820e495507aa4c9b495bf694 +size 199058722 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..23b0bf895b103e66c876ccf4c9020990c0bd221b --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15a9671e39182bdb1c81955ff7ac9bbfb42722b3a130fddf90aa9af56fb0b6da +size 199058658 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..334a13796801f8a4bb17cff97bc2821bdd2bfbd3 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a4d1e33cd23d58f2d1c88221a4374558b30017ea65be539d1b0a64adf91289b +size 199058658 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3cef4609939ae142ede7870f89a96e8f961665af --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb59bd412a1091fa0a8adfc0d409bb414938307c70caa5246ee933e92e297b32 +size 199058722 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..125f88b2bcf02abccb0e0e6554dc43bb9b92b3c9 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89109bb5eca2d1f7c01c9fcbaad22ed3cb049cbd8cbf7f3b5fab09e33aae2056 +size 199058722 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1d23c10afe1aea5f9437bf04fa4469024300b9f --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebd46c30997411b58a4f99de684f06948b81101e9f8b776b1258fa7e1ece464c +size 199058658 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7fd5b9321fbf9701908a227e27228833ba374b06 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:166bdc09a6fcb44d0a93f95be167d0219b618b1fdfcbdfaac8dfb255733d2e1e +size 199058658 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..660ad554db3acce30af289e835d3b5eac601fbea --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60a54a1d9bdf8e27171900934e70b7e1926db5383f20c90def78b3376b08aa77 +size 199058786 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b86cf97a4c230861186d742392e44efebd25da36 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10dbe49b248fc93a896109e5bca196e462d4361883d21e68c7c4a2e867b8f675 +size 199058786 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc630e19d0c91c31543e014fb90c93794b3b520c --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37b7ae0c32723dc5bcc3904da5e02bd69ea52c912e8ace3beea65ab859fd7629 +size 199058658 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..99cb0ffa0953ecc2a64fc28a87a35bfc816a7018 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55a0055b2b0e21237d5092a122ac24bd99614d259c91bf523ce4eabe0c093127 +size 199058658 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..30a80ecf0ef772ab45d98dcaddcd906ed022e8f8 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6078afc314e54a3100b9efc3d4b532cec969ae348177fa44eac4e9b777ea665c +size 199058978 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f05d5423d9bf95a26bf3864407ccca93bc96011 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c7e696c603f52829da38ffdb445857dee160f9e8c3204a67e4b339295555cec +size 199058978 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..badd385d5b27ed10b8015e652c186c0d509f03d7 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb0d236f1323b2c0dc8cbeeb8f5da1190e408c829e34775632da88499e5a8377 +size 199058658 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7a23826bf408f823a6b327caa3ea9daf4db6d0cf --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c9e515a13c83a4ac8814b3b75aab3a8520ed526acbbb0c248b49ddb7b39692c +size 199058658 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c7d7f8fb7cc7625cddeb4182e4cd053316bd89ad --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:980999d630da4f03888e926d48d1d93d9c13511dc815409176994e9d2182646c +size 199058647 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0bc3b104f94e47fc60ba9e353d1b283921de7e80 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17ddf05ce6d60bdfe5cd862252cae5d20ec7d39c1020098c1acb55e6219b3921 +size 199058647 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6efca33c19c2a334d9e84938282b8e937e8663db --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:097bbaab5b0c6e9cb5649aba0899ef5431a27b92f6552c7c6e6d662cd34346d8 +size 199058658 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b4f73aa3d29836a44dc88a98fc6bd78b0e97dea8 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:183c8ae3bdf6b7d360051c8ca87caaf2e93e42299206f940575b90eb88bd2c8c +size 199058658 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b021e0f7ccb2c7c98ebed3156dae310b91c813bd --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f3486ba1b649ea99b627be0e2add2bd8f29ec67755940ce0b84b0df1338729e +size 199058722 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e316277c5316f43be504990e08cafd949a06c49 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ef720ea964859124da4efda0325df5467bfaee16325c3251205c2dfe2125565 +size 199058722 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f76e7b5787b6f4e8afaca62bf1f7c4215367aa08 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:540a80101620bffe802eb23a228b5e0f9f4aa92f6fd263c739c1fc605e9d79ce +size 199058658 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a5ff42ce1195dccd1620e8342a1ded0959312df --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12824920741c0ff0647c1f40af86fbf1d990e89d50468aa587daddd0c98804ed +size 199058658 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..14fab53ee09b00a07ce52af7a9acf0a235a49fbc --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:382dc30c03f781b0558adc4b22ded2373e8cc4ea6a81355fce15724d140f47db +size 199058786 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd60c7287d0649a09765eafd529c2b1e50aeab16 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:752a9b2209ed2a64138552e206917fd9d1575ec744d344d7771a3823b783347b +size 199058786 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..70c4a297466aeb0cb72c4833c18dd5ad8c443c5b --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:171e888b206b9ea7e9b0145099dde04dd691307ba0dc607beafd38c3a6a0a77a +size 199058722 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8eb5df6971c034379d06bc9ccf51548aded59b2e --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:860d044f83088253fe11cb929d6c121a1156fb2d570fb87d6da54f114d2c748b +size 199058722 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c93dfbd9b6081da671e7e92635d1b74c4dfdfca --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:433ff674254eb6c4585af09e07f9bbf9cdc979e2986f5b9673141efcc6151b61 +size 199058850 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..096b9d78ab312c804fd5e949bfece7096a9211e8 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6cd27059fbd44a0d19d4317de447c6a247b7ee878734fc134ccbd03b034f03a +size 199058850 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1cdae040061303d0cf0ee13bf7d6b44552341f4b --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f94053e3a4340964ac47166fb4987cc53f92681539ceb3ba943ef14c115bd64 +size 199058722 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf0cd91fa1d2f8ed3b0d3f4c8828ce97113e5cca --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4128c1b6ace3c896fb1435ff771a9191111827ae636db3d3b09c437eea542fb +size 199058722 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..de819be952e55b52472cbba23afd7049d5d879a4 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cba2090eede784360d57a7f9536a4b4120ac27240adef9c32346c8963dc5a2f5 +size 199058722 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f719c6c4740816117ccc6d4c197893cfad7078e7 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7533bcbb448870211f595141e5466e1890f803d675dec68bfb5472364c54991 +size 199058722 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..330a8145a1213f7e4d8d6e8829d698843268d76e --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:adcdcb3f5499ab55f05885a4f59a4b46b6520f48dea596b8e9225af6224a57df +size 199058594 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a37466318905dd51a1e095d5f7d5f312709e161 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bcd701e211e6f2a1482cd31e6455967dcd4dd23dbbd462b6d55339d4def7754c +size 199058594 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..64939becfef162aac5cabda232c3bbc99ec01b3c --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f43d8699a3262b1027b3f91c1ab7fbad3ce8013d791ebf882c476f294b6e8d3b +size 199058786 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b1546c43fbd87ea50dc2039df679cd4b52062317 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:217fe47bafe9f082976fc2be1d7c21d8a3c3dfd82abf067d3867999cd32c75ac +size 199058786 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a87fff24dd2083d44ef565bdbfe6986ed628de5e --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24cdba384ee2f30091087ed250fe4b8e2ffc2579c5c2602fadd2449fb78d237b +size 199058711 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..073ddb568892fc22afa2e4849f9a885c72c9629e --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01d04611831e5a44fb0816e87aff489d4a0c0fceb8143b8918d98cf26ca806ba +size 199058711 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ed4d573869528f402d86f6613a628cfb1c3015e --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5203f00e00b4ecc456e026b22bf4a68e35d0d87551ab52a733f48b6ad17777ea +size 199058722 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2cd2fa9861adc5dbdb88f1a964d3b0dee5db5176 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c68a4da8ff675b36c10569d36242a2b4d2e8f10a2a736ebda8d8596c454c354f +size 199058722 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc5ff7f049880d6f22ed2e68ae4703a7e0ef9489 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2dc659f228d2857befb068d14ad4424a0f3db9ba2d05ba2dd10baf544750b8a9 +size 199058722 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b02e0f110a1a8e98885f9aaa8da29272b43f4cb --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:669fcf0e36564cb1a75c15d7c42a66ea35fd08b7651e3cafe56c3d040a72eae0 +size 199058722 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d15988c331aee483bff971052374226d5c223fde --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3d091f5b1630dbf45cb2ce2bb1e038230449776fc915cf2dac38e1281c40d91 +size 199058722 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6afd87613e7be2c35f27a03ec0dc2634af925ba1 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1f950b8dc6b18c4907eefc6d5b9c446333c984e7b0f80f7ed88aade3d0dedc5 +size 199058722 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ab1b3271b4bf39722c661063a6f4a43f41900e5 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3488e4bc0b1054516a352a87cef2d59a9b0fb13549c06f958f4e5ec27eedfcfb +size 199058722 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..caf011704897b37bd73f38e0462ff307f343a775 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae2ef34bc65b3aafd1dbfa6bcb1260d5094ecf8667a250639aa3119a7b5f9250 +size 199058722 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f895e6e838608c3e2afb1cdc55e313488e9bf971 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:277b3df4de3a2ec1c7161d6f212509fc96fa0edf268d931502eaea3379ab61c9 +size 199058722 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab4f896de3b37231d19da2a977f849fbe352682e --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:497f9269b791de7019923c41073700a070346049fb5ffc5dea98b76165065fab +size 199058722 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c9b890a88127e116c5dde1cf2e6f2612b346893 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0fe7e52a05a9e978beef1d915a2ad8534555cb12f82674874f11207f1d2076b +size 199058594 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..922c0a793ccd1d8f916c3b1ea51d46c0589ddcb4 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e94dca97255d07fab51e9ee72301e7adc9905628b4ece1933fce7fb824fcff02 +size 199058594 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a2e1d36439499b07c7b5e137586a989a2e6fb6a7 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:759ccbcfe8574ddcfef9781af653aa53f6795ed4a5d5e07d4520e7738525d142 +size 199058722 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9dcf7bf119bb65901403de33f6e2df550ecc3ad9 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a667d9b0958a5fab5d82bbf74d44c3d836b8f8e328809e522d87bf9920c53af7 +size 199058722 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..98c01203ed93d13f4d7dcb49febee1043578d917 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe1f955b5c1fada42be537c281fc0918eb94790a2a43e7b8c85404579d18a141 +size 199058786 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c75c42557e93d748f9bc8a47a75a56e2c5e6fad8 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfbd5e87f16be4e5a7fc76c1396bd8768069cf3c76f00fc2951767aee8da2933 +size 199058786 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..71344b1c6aaf8d4912df4d31f3b657bd9a824b0c --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50880b6cbbb29f72e045a2fb4d93d5d75af86337757a5f4874867de30d2c42bb +size 199058850 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..28b701b2ed433935fbddacc20ff77bf28dae7723 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf2b7592753e43844f7dec4426fda3fd69ed3f31e0419cb40d6d5dc36f5476d0 +size 199058850 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0151a1e7970dcfc08ec35a8f80e76fa7ceeddbdb --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:855e60bc9fd75de01b24a6564f55a8b7ab4ebc32e9fe3296d490114381730250 +size 199058658 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5179a23bd9bf967bd276854f587329946ecaacba --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb6050a4e5ed0822df1ad18e4868aa125e089ad3d49866bbb95ad048b4e323bb +size 199058658 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dcbd2b8cedce7bc2ad6a752aefd5e747e38020c6 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7cbef6015d3b453c1e72aadc1467543efa806d99c1212e038324c5c46b0e555 +size 199058647 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..db54c52f7beb8cdd1c3062b57011c50f3d621776 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3875965f9aa7ee3c111671bd511ee4b0f9276587482ea398c6d11cdba22f9b7 +size 199058647 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..303519ad9fe802ba5db89e28ebeb33b304c9a25c --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9d27d1dba0b8ab51850868dc7cebc1bdda58fc5c7e7deea601dbfcbc1baadab +size 199058722 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e61bb197115ede40bbbb433fcd2b2a869ea1151 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c012aeebc3f459f20cd8a9a63773343d9ca818591acd5c147a547324fed7cfe +size 199058722 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf57395dc8b3b71d4c41b27d46f73c2bcc599898 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8a46e4de7332a2c359ffb43f25eec9a91b74f5499f9b9006b195f85dc9752e9 +size 199058658 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b8d30e9659e5190d80ad2650813f82c5ac366f0 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34e6c3acd91f460f4a6ffd81fc69a9e89f9306c81c4383fb45f403e3c500a0f7 +size 199058658 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..229464ded5238fb7756ca7a90594df654d50d562 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6adcecdab6c24c79fe6975919b03a4dac770a7d6006e637ab3ab1214e2f471d +size 199058658 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f9151f8a586e08efa1ccb62238064a286968b86e --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93c8eea053cc9c97aa89602a1e4596e109afb828bf94b0d18fe0df1ce5b7e61c +size 199058658 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ffcbcc6f4f2ba67bf644e7ff39163b0c31e8eb6 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51de2998c17ada49603ee341b95fb152d3791f7a5dbaf62db184b360fd6b187a +size 199058722 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4589bee2cbcf49c679e1cb7aec3a897916a608fc --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a0daf871e28eb9437ac319ade2fd872236b046c3c7ae30992276444ed1cd162 +size 199058722 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e72ddde648cb3267f76dcf2e4905d7f04bdfbdad --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7adbcd19ecd06a0ea3a7dd08591a8253d8f62ace94b695f9e3ac22d862376045 +size 199058850 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f643a5154f9a746f36f7fb95ed257d15327bb59 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b39e6436aa4bab819e0fbe9bc8d27e19f9f9dd793081d22345bd4d92c009ee0 +size 199058850 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce3eb14302f6cb830d5bdc78d299b2c5a425af20 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:276668f044cb0a076eac4a46c44ebd31831c46e85624a7de3c8f35211549207e +size 199058722 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3056238a544ffffb46d76a4804cad2a85287c39 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32a1cb3fdefe55a4f8c819e1025e45dc34c9901e3d91a91efc5c71739ec69e6c +size 199058722 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..94c59a62165cdc4f7e109c4a259d1102a802f4f3 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58f820ec9becf6d0659374838329a104e400b232ad7cef68bf10b1fdc57d8a33 +size 199058658 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ecb8e76b2a88b4af2240b70e6e299feb1ca265c0 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7152604dd9bd039960b299de50ebcfffd5e665a336c73550dfeedb6d30a3762f +size 199058658 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0870773174385e1ef74f8f7781eb018de65dc56 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5fbf2df645222ca8524a9651cc9e5cee31de619b14ae517602637661172fa85d +size 199058722 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f4d7a5e906785f28994f11f851604bdc9921c949 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98722b446dd5e21163c53e4f0a3074906936dec4627527c5977083cdeeff4932 +size 199058722 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..df3d4b1eb378d4b0170d686e516a75861d9f00a3 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac0e53d78306492ccecf05a84721f81c4d4eb2ca16958bdf4b4ab88b0d177855 +size 199058658 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cdcf0e9406c8cd8371cb8f44259552f9ce42f563 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ee29726d5eba4cfea5cf8454d0c6afa66d6f9b93b102aa3e725eb1cd44d9f0d +size 199058658 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..100fabbb432d0fc93ea93df97b74a68491882610 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e1896ab0273598d304292d52f9612d770fe1d47c409062c9472270125dd1216 +size 199058658 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..21af111d755bece7e6a38b6a0c88c315e1e0125e --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f181f630613dac3d1fbad62c5f793475e4130a8d7ae4f6c15ec8f7c5b7bfc94 +size 199058658 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ce2c619e11b06f5129b6f6429292a7731292c4f --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a770d47c858d907ef920bafac3e670db51466cc34aefaf6feb9e2afaeec269d9 +size 199058775 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..747b529c454bd6390e40740c6d7c0373be128cb4 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47cbab7e4e1e328dead6113fc1b4a9cd73c678ee8305276fa2b35669fa857c9c +size 199058775 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7e1fb0b47fd66c9a8557c33cebecd96080c9b34b --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b8205ee43a94059bc8a378710b54931bebe1d24e53c8249fc31599589cc789d +size 199058722 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a22546e389495039bbe1c3a3e568d4ea518945d8 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d3a21d82e706863557e0cb9de2d5f5c8bbd7a41441a8e7289b587a2892e34f6 +size 199058722 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c848a684f2f73fe7749c6e3ce69a162a23db0f57 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:731fcc4debaadd67b17076a20e846333f6f1430f198c6437db78de90dbfbf618 +size 199058850 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..321ed9f73e1cb2df47d505526819e0b0d4849dda --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20d95f5e8284a6fa59dda73154f93981cf2542e536e32c7d0c1ff59f8dca31bd +size 199058850 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fca0f518286cb702f371f82071c0bb211574f37c --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd46899e782857e377b897a8daefa67ebb070dcedbf07396b80eedefe61d21b4 +size 199058722 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..60ac7b656e8ec585b4e6d41de5c3a0bb80a58c60 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b5fb985e420a666062061a26a802e0f67c49cb11b85986ce4a18e0f0f8340ff +size 199058722 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..45f66c7a98894018f961c79c6423dd6db6bb32ea --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b5b32e087acb788a636f318ea05d5cfddba0fb28c3bf289a0db7aa0b113322e +size 199058722 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d923834589d3aed9bb6a1c7c4d8b2ffcb7b92b8 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50921c0b01674c92d6f794c4b3107e6b5a0ebbbc72545e4888198a108581f478 +size 199058722 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ecabbf357f1c18fc483a97748a4cca0a48900c7 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b67a0ad4affe9e497177f6883a6273b2addc74bc5b9933d2cf6fa7b6d37ba89b +size 199058722 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc044df3ce08a86eed5282fc4d7e81c6b57c1844 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:903cb23f777308f72b854173bfdfec0f6509ea026a2f1a0f43bde01650762a14 +size 199058722 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..89495633dcf313756ef4d0088f2805178285556e --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8adc0a7030635a0fa70a2f155a9898f0624d628fdc55eb340b133935daa3e957 +size 199058658 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..168a7f13b25017be72e18df93a72ad6e0fe59ada --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e790b46c6544d025a286254324f4bb2437cae883fc89fd529a5d46f0843d8d5b +size 199058658 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5dc2710f5094b594c2df6ce49fd39b5d907edad9 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91c9d2b8ef12e41681fc593689def6e6ab9920ec692ec21da733a7066aaf00b2 +size 199058722 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb09a8a1982ba5feb98b72a86b5dd5f87925b139 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f59e43bcbea8dd618acdcf02f7fc4a281a553d8946c116e6deebc10b0df4bcf3 +size 199058722 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf20243a4a090c68255a95147009f9382cccf0f3 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9383d57b40fce52adf844d95a662f4e522068e6f16b3ef22acfae31fec25a485 +size 199058658 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1cae156d7835d3623169c90432496a476678de27 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7fa464236aae7f1ac5131487e711de335ae90d0234865202a51d746edfb89dd +size 199058658 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f7da97bd331254e260fde808ac3370b329bc4170 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8bfed44c8a264775db742a78287c91d3c9df84b5a6241b6ebd95d430a7202b28 +size 199058914 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f2f54122166c4705d74e70120d1f9f4d31ac51b --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1559231a3bbf27827fbe0596474252c4732b0eb367d017f2c92433f8aa34935 +size 199058914 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9ea9f6a0f08bf9f7307b72e144b225976b077ded --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40dbbe73a93babadd0be5f3d451c8202b8e5eed71374cc9bbb8ad42ef914104b +size 199058658 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc71af31ac96c1ae432de085645f51f86d58f980 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e346b7e74346df05668892fd8c20401877f31da6a23593b7b9b859c949c13ef4 +size 199058658 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e612a128771e4cac06642507dd458d33d770544 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d1e84aa92a8b97006934f7b3334782c12a44ade60bb0eb528c7c96074e7c29e +size 199058711 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f0af1dac894022f81e509984f98fe6fcfccbb7e1 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:569374b014da14b27c13aa810b6784c88aefec54e43796ff931eef4d049e0802 +size 199058711 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..48447f8f17806ec3cb89f261b6d875c6cb4543f5 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55ea8c406a9153d27696afd05f4fbc58dd4180840f1b4967d715f5b480320c01 +size 199058722 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9add72a86350bbc731ba369379b232b5528e6621 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:236a34b506ea07d8389770c01ed668abd392666de703ef88703b32fe647b38af +size 199058722 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..045c5c08ebd602905ee67da44184091f08245c56 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b37da4c060da81abc5932793dab13f4f57c717cb6e99ba846e2375a5962109de +size 199058722 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c690d9a0e351461088eade6e9daa45e47a17c41d --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7de01d0f874e7b75cafcf9a43ccefec34f542949e7f6d6085901343a30eb420 +size 199058722 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5dca326aa7cb7dab2099c249b57e16582da40d94 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12b000e10aa1bb17b05b64b83db816c61dc40d81e0fae535d49aa8759e09ec46 +size 199058722 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6db5acb440ea49eae0133710869b0c9f29d0c081 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a43dfc825207dfbed53353d437aff7a72fc5b73d8250f5a6ed5056710a3a1653 +size 199058722 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ed1086575186f49eb81619734dd567d92ede709 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8255f1ed44669f46b7b80cae762259c3188df2e14a6dff9c11487d757433abe8 +size 199058658 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7346060ebea6289c2c64aad3305576ffc75352ed --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42b86ff48e9af3135a5b4537e73ae44c14486e93b1d36e6bd8f3157a7b087f6c +size 199058658 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c3bf43dfc871e949dadfc24a7da3e86460e1c08 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:919dbd4dde4c3d9a867fb6d8dc475cf83b1298a1e7d356da0734504b03add9ab +size 199058658 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..88d0baf9fcec95b33179171b5b3d8aa9010ce4c2 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba6c4eca1540546f8ef842797a06c53fcecae247a7ae0bc1cc42158d74cd040e +size 199058658 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf7d49215f4a9139e33465fab2df8e4b172a20d3 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44b3eda37b51c98c39a2420edf7187765b8b6ac50ecb9873e57dd82516b0dc56 +size 199058850 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4bfc7d3355e4aaa07376310873dbaf6906521dd9 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88be8dbd41b1ee5ffd689d49b34db19305b72e57cff200ab062e7c5c24e40db4 +size 199058850 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..451cad148a1abfde574368cd8e8b547c04ab4664 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e9ebe15d9b67ed5f11f6a4ab2ccda89c8ff16a48ff0fc113b0d1b4368c861ca +size 199058722 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..721d192e4060b92a1ea616d89449c688e6c1b3eb --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a57a45abc19459597af1c6cdff1e30d31d09d737a87d0112750faa191afaa4d6 +size 199058722 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a00366b3ff158b4eb70ef7947d4887e1f8412d43 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75b21cb892ad57b2a21495474ab1b3bceb7cb1a08a23d40be380f6d0c65ec300 +size 199058786 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ad83f6a3eaf150d30539fe46274e85740ad0509 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55b8a5e55d092bf1791072f65936b5f62dce4f1e32e5bf9dbe78d02f0d3e4a50 +size 199058786 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f4047ae009ea862cad7942b23c31b11ff1e952b3 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e4193850e49015636b3835688bd361008fc3a3c97d0fd4ccc86852d3bd76686 +size 199058658 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c454dbf7c5b4d93448cc1b321ae6bc682137e8bd --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f3f7e6a465f72279455dbc04c2ec1946f55cb5e6359d6a6cbdca88c50908819 +size 199058658 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee3a4084e457a8e93348d6335975b313b07f76c0 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2249f644af39a72bdc058cc97d573953c92576d0f18ea0692883b7821d2e62ea +size 199058722 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c7bb1fc5d75dedee62aaf350f331cc87deb85df --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6703edcf1dd152f22258aa611fd53bf0c66ef053bf0a6464fe3c033977920e1 +size 199058722 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b97fbaecc0536c2c07629b0c0dea81c7b0311b60 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a022311da2ef87c924d24c2849999d7832f78223ae9d2df4efa8f8d2e9a19bbe +size 199058647 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5dd3bdb2ab91307e93af30ebe2f6423e547ebf94 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:818aa7b14eb398b2eec2c58b7b65cc20bb83ec52844be97b482edd1118ebc9f8 +size 199058647 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c2ff337bc747b019f716f82ebfc12f89f0767e4 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a34150fcaf72b7b3c84599d593a2f29f0eacbec4d745245670b09a08bd3cd62 +size 199058658 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..08025e14f6324f9ebac117bd4b3df403a7e0af5b --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:485b3b478c3fde6076e1295aef11db4598aadccbdca90833d2e27eae601f720f +size 199058658 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d62cdf79eb455e7bc8e14a1ac5f58f222610632 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1e1af32d6cc6e4d28d5313367b3e6c23e7b7495536ee5e6bba7892427a4979d +size 199058722 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ac3e12b6c5bfa398f6e17ec2e75807e4309894b2 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66efb1ffad9ea7ff5836e2e543bfe6af665036c595906b829a62881470d2c2ef +size 199058722 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb3a1d8276e4348441f1a69c55763d9ec3bf0d52 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd60258237ff3e1c95249b60d7719f802cec6812c63293c89287f297928add53 +size 199058786 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8150be7c0852959b495fafd10533961cd7c607ed --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84e401b65acef67bb007dd1bcc4a505f2417f56e80e93cb42fb73bfd516a024c +size 199058786 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..10da935d4e114fa9cabe621b10cb753fb78367ac --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a6ffa4bc88e967678f028da0d20f4b5cf7b857854f0959f09e98edeb839d375 +size 199058722 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2298607427d432cece5557cce2a637d291900f9d --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbb6c213fd44664c4a30456c046015285ca2a0839ce443593667e3385cbaca61 +size 199058722 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c89ac16460d8074d5d5cfd9b8bc8739fa3fdef5 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7cfd9a3031cfceffe5802f22c7b2236992e956807bd10d7571965211219e625 +size 199058786 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d9339b1e4bb02dc187ad5a8e0fe59e68d05fb9d --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4cea060e868b21a8874d8b128b8d298c511e0bb4bdec1437bd87dcc5f5d46363 +size 199058786 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..74f19c579b54c981dc0109e84d9dd58125a3cc1e --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32b369a3d896d9285ffa3ec3a88c0834ff392e9744c5cea10ff7a4d8c52de0b4 +size 199058658 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ff8506c441ecf41dcaf567d1bfdb19acc6067fb --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38344df822909f962a1767ff91db936c47537c366a829d2c8ca6d062411cc0c5 +size 199058658 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e1eb43cf181b02cb3352e29d16a49c63dfddc7a1 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77f9d47bb7755c04c83ddbe12d269ef480eb7a1a912709fb5f468f59c512429a +size 199058786 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e93c70c6c6360c461689ac90116857eab0fd873 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f2b4dea71198c567ec8169baefcfdbc587971f621e8919da7a39f382b411d00 +size 199058786 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ac82fe3e5c155c6588b02552bcba43b1ff302996 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0935ac23d4bcb91c4033afc8b9234288a6b42e05980afe9992be54e25bb054b3 +size 199058658 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8688b5bb2291df705fc376717ee5b507d64ef575 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f47d6635232e968b0432f4cd31dc31b048de00452bb3bafaf8ac6bab563ae24 +size 199058658 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc15765a1a96dd7aca1c7ae7a1f21ef05a61b5a8 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eec3e1b77ce80b79fbfcbab98cefd6bd7c9fcf51d9a7fa8a2a63923982f3ef20 +size 199058786 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4fd8243beee72ed4d80d15a248f58cf499a9b37a --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b60e8d01142ccf678daa3e9d39f78d97813852617ede2f54cc15b1c96dff472 +size 199058786 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a7bd34544eabf0dde27b6113d3aa334350a6538 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b63eb878df079d6518f087580a5cc2b25499d2671250762fc1fa83b2bd5a4667 +size 199058786 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6527f278ef57e919a3e4d49ddb54df0a111b3d24 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bbbc0c26fa5fa0f955cc0e82795ff453b26fe0b905edaabfcd209f77fa0fa4c7 +size 199058786 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..42d2b412468fe144db50c7842eab9e267b274b2f --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00bf8cb1273a869959e298c578ec2c8bc62b17e456df750a9c920056c2eb2e1b +size 199058647 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f168221307247a1e09324a95171a29a62b974867 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b88a5c44b2fead28c47671a86fc945441c9613a34857da1a474e4da54943fa83 +size 199058647 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0d880a506d5653d2e4f7abfd6d17c3a69a8c748 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d62735ed73aa3b752e5b2601e837a080a23afe3a6475aa6ffac595bb9ae4f82 +size 199058722 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..365030f2df64d41729edf8b496c7356a69887305 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:582fba5bae3aa61c1579124be84ae83866422bcf3881498bb164b5e6fd802abf +size 199058722 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d0ae54d617c95edd93deed5dc23eecf5bf2fe764 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0adf58c7e716fae6189658ab5b0a46710916764757bf815acb127820db9c620 +size 199058722 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f983618bb47d9084abfe0b356a1026cef1ea1e74 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36d962dd880ed80c8f567aeddc98f8cdefc36bd32c9e9c3c8e985c08bf61997b +size 199058722 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..73294e1c34670f48a3155cf8aefc72e9c9324fd6 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4aae1d4cd03b335374a9fda875d845df3defbe67d7588d11293845773bd25aa2 +size 199058658 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1230daa2f1532f14a90f9d350522093ccf213ed8 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf9c32524d811a7c96bc03b2ddb96423c9ccb8ffd0d21ab484f38c774cd12586 +size 199058658 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..931a87401d89ff6558e3a78036fd7c8d0b5fdba8 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c1531223792873457a9c2cb6fe6b4b324075e07adafe68d08f59f6f2eec4df0 +size 199058786 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..df0ea8e38b0ae3c4b250e77b6e0b941ad33865f5 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6cdd80cd623d3b3aa86ec23746b35753a75bebf0b1761e409607b0ccead3ee45 +size 199058786 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f04ad3382a04f4f28d867584a96fcb446b6a16a --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e9a14f3499da7b849c93676fb305cc8600d5a26106609450ef3ce97ab4bfa98 +size 199058658 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7416dca9312f752853187f7ebba535282a584baa --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f17d059890ba1b1bbcae95f9d9980656cf28b3b002d654e288c5369b5302dcd1 +size 199058658 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..119f0279306bbae4823a266a48cbf9f229495921 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f6ecd67a0388bde76e53cfa4919018aad1051046201e485d1c97fbf886ae834 +size 199058786 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e7a73d33792c170b090503ccb8ef666b5b4db13 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43ce8397c57cd4452ef4e0e5b41848dfd23dc12fa609d25d7c7574d32b1c8677 +size 199058786 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f3897f3231c70344bbb876b7d4473efa93e4377 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4361c295896239342695a2b6efff4d0227c5bac1905bce1889fdf66c260589c +size 199058786 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..96a58fe15a15db796aba19c731026914a0f337b2 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76baa42a02c277bae4577328d08ff23f46118f15b087b319106c6b15554d7b4b +size 199058786 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a15da2090a32fd6b8f2d535586e43894e6863250 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1ad694afe64fd79083d9c9451cc2b31ff56c78a5d5d4e09ae9b627f544e0440 +size 199058722 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ce892f399301ef7af3beed8b7e20343d6d6e49c --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23aaf89ac7f5cfedb1d72d4e75b3787e4f27394d0ff628df11bbcf8dd5c84cd1 +size 199058722 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb6642b9396efd80499febc71f80703705e25d92 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2348e52b8dc094ed1b5a974a68909c692aa19b11964aa480291799d3e8755b2 +size 199058658 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..32e27fd512f5966ead4deae023b9c6739627da47 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c4eeb6208cee741205bc7c35570974dd9cdf687e8ae10839c1b82ae55cf4727 +size 199058658 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0b6520c15dc443fc8970a8fa6835c4a017e8e043 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0bf2be51f48778b96f69054c86f5beacc53b59f009c26fa8cf0fec63ee631dc6 +size 199058658 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..70c65d2855d56f53874be7b090e584e463be1690 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8faf9cf9fc271d78f207cf409ac854b4e43f33e587a74895aa27d41d10665ffc +size 199058658 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8c23ca549cf0a5acbd043c3fcf97adc44dfc1e88 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ae64a76a471ce238f7aad14b2aaec3fc315077acd3abbd048d11d99ad2a5c60 +size 199058647 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bdca00c3d798aac922c2c097f5b0588e23b87075 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aeefc98c8aa3ed6a5dd5f8145d04da5fdbd0a984042f9fdab3246daa59162dfc +size 199058647 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c914bf640f027ada8fd906e110861b6e9333c31 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4940b2c596398704bbb6674922b06a054a5cf9a07c19070f0a5af6539d123dbc +size 199058850 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eedfddbf5175813ac3429a87a43dfd9f194cb470 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2ef9d2136e3a18a7d4cde1af1864a07434ffdaf735cc1a5e32a553c14d678e6 +size 199058850 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d5dfd2ab9574517aff68da9d6fc84098089dc215 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c135b5930b7a6ba4428165878781135954b750eabb0acd48df54f05e4bfef1f9 +size 199058722 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f090bfe263d0df1c0f487c649c288dcd9a1813f5 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9560b4f98a0596c6c1d593ac312be5e1c54ea2f789eb3fab9b71756b0739436f +size 199058722 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a67e1bb7a37808d2978d48f13931cba2d59f306 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:712f02f5aab0bc515157e14a12b98ef4641c33c0e23227215d6497fc75f8071b +size 199058658 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb396a130cdd006e1717a8b7adf96bd5868737c6 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f87b56f55700444538897ce1ce0c6723be062eb6cbbe20bfd51bea26095b200a +size 199058658 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b922ace63b09061d48346ee15e9d56deef4041ae --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:319640e08106024ed444626a06ff6125baf79fc73931da6168c9b493159fcd0b +size 199058786 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a480f1437c3c9eb0377d8b56e5aaa7e7e333d03f --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df4c6d656b18db3a1ca9a1c086a3566a6b5214b4bc68f9ffccb3c7846e656874 +size 199058786 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0be28962d108b6d97b28fd850f5a2363229063e --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:062c46ac3a7c6f3500500446755783ab2bf8149e1d3a29374af7ffbc113600ff +size 199058722 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..86aed2bacf16b1b8f8bda336fd345122b243fe39 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:954ab2136c4b2265d376b416b86f89863a144d34c35a480721d4adb94a89762d +size 199058722 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..04f9a9fc89a91482a68c5a0136645bf76a120c64 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7920a185dd8bf13cc626264d6544c5c521162fd4930e3bccaea4962d29f5b6c2 +size 199058722 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..de8ea054bab855f45a92f3597626cbe7055b3718 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2292e593a58e57fca154f16c1bf9600ad6acc87c03626ff8ad9fa4cd23337cc8 +size 199058722 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..77f5826cf0d9caa0beaabcbb099979e93ecbb40d --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4837383af75d2aab2adaefbc75ad69d6c278eb71cb185b5e2511a1e3982dc8dd +size 199058722 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c158c3f6e84f48051e7a4555631188d80d585d50 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4185846e1aa155e81b201b2de42dd59f71c4d41884d769d42afee83a4dc1faf2 +size 199058722 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..991bea03c9d8a5366184ddb192ca96f9c6cf0e50 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4acfd88b1fa485e8410e979c24adbbafb8f5c84e37bb5a726a34a24904fb8f07 +size 199058786 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..463d5f0a088637c6f081fb9f02d1979b43f2d5ec --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e843644694c0c74300ed7e1baabf76af60d9b903c6552b27584cb2efc5381266 +size 199058786 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a79ab8e23c11c6cf437ebd5ef9b3ab3d05122203 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90025865d1361c0c1ae372bfd096149180c9d10e585317ff55f02f8848d8da41 +size 199058658 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b1cb5c0c29a2340e47742d84d2e4bc562fa56334 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0bf080d71186752591e8d6eb9b2ccc43b3946c436e0586030109317e50ad164 +size 199058658 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a45516c79a2eec3047c25d3594f346fbbf7e7816 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e25d91f2d878481c15138b77caceadfed44bedce76f9fa1543ec9b583c7dd46d +size 199058658 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f556ea1276858363ec241455c774184a841e58d6 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a5cced115e9096c5a2a6b6e2d83e5fded665b0c08728f0a45e8fc5a2e1578fd +size 199058658 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8267329cdd29a6df5c733f9e779d28732b246a97 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7124620c6bd6c6c7bcba7d769ee8bd4ab7556bd6be99defdfd9eaae70e4ffc4d +size 199058839 diff --git a/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ad0c43837109f154b740eededa5ea7fe2bb905f --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1690982edf10abc192092d6e3a189df1385fb79c2e6b375e5565378a8bb8220d +size 199058839 diff --git a/4b284b84bc4seed2/global_step80108/layer_01-model_00-model_states.pt b/4b284b84bc4seed2/global_step80108/layer_01-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b48e1d679e8f3fcc154ca4dec1534fc8a863d4c --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/layer_01-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:841fb8a2d4772d93e650066d0d9fff3b420c737bce0bca7857e69843dd95fe06 +size 167511299 diff --git a/4b284b84bc4seed2/global_step80108/layer_01-model_01-model_states.pt b/4b284b84bc4seed2/global_step80108/layer_01-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f24ba3db78f204b415a8d9bf6725a5886349af3 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/layer_01-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fda2a1b6983c55181ee3987ee84e7cef2c5b1bb32ff7db2e453770a80aa52da9 +size 167511299 diff --git a/4b284b84bc4seed2/global_step80108/layer_03-model_00-model_states.pt b/4b284b84bc4seed2/global_step80108/layer_03-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6efd0b4436248454ebccac9bfae1a35dce89c6a --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/layer_03-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8cf61c1840ae2d58796b0e0ee00e17451b7edaad0ce7436c22c8878268266b17 +size 113308931 diff --git a/4b284b84bc4seed2/global_step80108/layer_03-model_01-model_states.pt b/4b284b84bc4seed2/global_step80108/layer_03-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e1dd6736ec00810c8ce0aec0d0e2b551adc87b1 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/layer_03-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b2f9926107274a23b935e3025d29785d96552b5878aa25f7042986b2bf39e53 +size 113308931 diff --git a/4b284b84bc4seed2/global_step80108/layer_04-model_00-model_states.pt b/4b284b84bc4seed2/global_step80108/layer_04-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dea1900cd5d3e06b836883e688e99bb9adb71eef --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/layer_04-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f27ca4f808a9657e3890e4e28efc10a26423a4aa97e6e7a9b8505c221e871ae +size 113308931 diff --git a/4b284b84bc4seed2/global_step80108/layer_04-model_01-model_states.pt b/4b284b84bc4seed2/global_step80108/layer_04-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..86f2f220cb29811b2a0eec8e1e344018410affb4 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/layer_04-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ca6358cc449c57d9e441d4b31b683f80800ecb2cfa4a9fa42ccd78c368552a4 +size 113308931 diff --git a/4b284b84bc4seed2/global_step80108/layer_05-model_00-model_states.pt b/4b284b84bc4seed2/global_step80108/layer_05-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..91c2fa5c1c04627f5fcf2b0d26a003f9cac7dc2e --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/layer_05-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:893d5c655abd8ca1b2b890257644abcaf7a5c1c337fbd15101dabe6a108b451d +size 113308931 diff --git a/4b284b84bc4seed2/global_step80108/layer_05-model_01-model_states.pt b/4b284b84bc4seed2/global_step80108/layer_05-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9748d1898cb59e82651d0fee22455cf429f88a31 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/layer_05-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d312f53a5325a0717816cd81491e6970d4e843eab0a09919ecf9f2e92b3c9030 +size 113308931 diff --git a/4b284b84bc4seed2/global_step80108/layer_06-model_00-model_states.pt b/4b284b84bc4seed2/global_step80108/layer_06-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2082e93811b72fe24a0fe67c89e19a11b1657cd7 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/layer_06-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:420fe5ac02487752ca61180a15c2a3df06569b04eb788147177806dd11041619 +size 113308931 diff --git a/4b284b84bc4seed2/global_step80108/layer_06-model_01-model_states.pt b/4b284b84bc4seed2/global_step80108/layer_06-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4615d309ec7f79dfecc5b55279cbcec0b7a12b5d --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/layer_06-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fab587f3859fea2f3bfa0412445250105143d006b6605f2eb7749f98ca7528d8 +size 113308931 diff --git a/4b284b84bc4seed2/global_step80108/layer_07-model_00-model_states.pt b/4b284b84bc4seed2/global_step80108/layer_07-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..afacc25c03f9946265fd161318cef58f8a73470b --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/layer_07-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1bd80c93bbf94d7b2a0643db792bc42ee9b96c83b9e7df6fe0c5d8e4f6fd723b +size 113308931 diff --git a/4b284b84bc4seed2/global_step80108/layer_07-model_01-model_states.pt b/4b284b84bc4seed2/global_step80108/layer_07-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..70e3c90f49196c1a8db391db06ef4b17e11f2bae --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/layer_07-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5c4798d8b9c546de70ad258c2ab794289a2d18ece3426cec2bc77a91dcd9d3b +size 113308931 diff --git a/4b284b84bc4seed2/global_step80108/layer_08-model_00-model_states.pt b/4b284b84bc4seed2/global_step80108/layer_08-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e84f00bc31c7945388951bd8b5013485011c4dd --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/layer_08-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abc44008c90fd3d96e4da0964a74c87b5b4706e6b44bf3822f23a83cfebf4280 +size 113308931 diff --git a/4b284b84bc4seed2/global_step80108/layer_08-model_01-model_states.pt b/4b284b84bc4seed2/global_step80108/layer_08-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d369d957faed7806afb319979cd6d568e605de75 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/layer_08-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e42d2ccc4da5bb25ec532f484c18cb8fcc91073a1457f6862915c25892f3f16 +size 113308931 diff --git a/4b284b84bc4seed2/global_step80108/layer_09-model_00-model_states.pt b/4b284b84bc4seed2/global_step80108/layer_09-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..15632ec9a4bab5a46737bd3b19fc24fbd61487ef --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/layer_09-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8ebd9eb4146b120fc88430020a3daa7cde07af50f940e79522c70efa00e7790 +size 113308931 diff --git a/4b284b84bc4seed2/global_step80108/layer_09-model_01-model_states.pt b/4b284b84bc4seed2/global_step80108/layer_09-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..84782d93ffcf01d2eaf3f534adf26034bbb53709 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/layer_09-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49e0e6c48f56197ec7ce8acd4da34eddabb0d9bee41c2012a4c57fb79ce037ac +size 113308931 diff --git a/4b284b84bc4seed2/global_step80108/layer_10-model_00-model_states.pt b/4b284b84bc4seed2/global_step80108/layer_10-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a5cbc348d948b04e4bc319365ab9efeba6c2ed82 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/layer_10-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef78ee7e87325ebba3e8c4b704ef3c805670c9f5e2799b1b2c1cb2ce42492d56 +size 113308931 diff --git a/4b284b84bc4seed2/global_step80108/layer_10-model_01-model_states.pt b/4b284b84bc4seed2/global_step80108/layer_10-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..95a420c4e1fee72b93cfd1fff981e4f3eb68f794 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/layer_10-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9edbbc1a882f68e7efde141e5d2bcce15fbec75095ac9af5613a547b9177a10f +size 113308931 diff --git a/4b284b84bc4seed2/global_step80108/layer_11-model_00-model_states.pt b/4b284b84bc4seed2/global_step80108/layer_11-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..01385639f8a9b13b190a9852f01078700de40813 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/layer_11-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f3618894eaa56c08201d6894d35fbd53203354dbf459503b8d138f9e5b19926 +size 113308931 diff --git a/4b284b84bc4seed2/global_step80108/layer_11-model_01-model_states.pt b/4b284b84bc4seed2/global_step80108/layer_11-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b93d94afbd5598be45471ad5b89f49050910702 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/layer_11-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e43153594a9da498e6342216ad7bfe36de713e3855013718031b9028f689ccf8 +size 113308931 diff --git a/4b284b84bc4seed2/global_step80108/layer_12-model_00-model_states.pt b/4b284b84bc4seed2/global_step80108/layer_12-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..74982520f05843fe71011d4bcb7724c55c7a4f56 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/layer_12-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1942c41df83e3b2c0dbeb6d0dbeb704e37b492878421d7f03f83caa59c95d82d +size 113308931 diff --git a/4b284b84bc4seed2/global_step80108/layer_12-model_01-model_states.pt b/4b284b84bc4seed2/global_step80108/layer_12-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e1c1f5cbbee6b2d4e144a43b994897b11d8d9a7b --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/layer_12-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:303acde4d07becc46040d988669fa133c4a495275d79fa947e9ea0a2419349c5 +size 113308931 diff --git a/4b284b84bc4seed2/global_step80108/layer_13-model_00-model_states.pt b/4b284b84bc4seed2/global_step80108/layer_13-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d92bfbcf2e25a4573dd7cc276da6c14781585721 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/layer_13-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5bbb787366f106c6ee61fb9d04b41fd960cef529dc63bcc7a42afac028186078 +size 113308931 diff --git a/4b284b84bc4seed2/global_step80108/layer_13-model_01-model_states.pt b/4b284b84bc4seed2/global_step80108/layer_13-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0e9b48c43bc8213a18807665720554572ba8604 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/layer_13-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ecc499f318fd02239218c4435f31754ddd647e06ff523df4d3cf9c9fe244333 +size 113308931 diff --git a/4b284b84bc4seed2/global_step80108/layer_14-model_00-model_states.pt b/4b284b84bc4seed2/global_step80108/layer_14-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..29ebb8d7691d7fba8533991a134f3e78c0d2b7fd --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/layer_14-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2dad1672b727c4f9dcef7a890619b9c942c27a3896bd4143f319bcea10026fc +size 113308931 diff --git a/4b284b84bc4seed2/global_step80108/layer_14-model_01-model_states.pt b/4b284b84bc4seed2/global_step80108/layer_14-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..323c3bf218e15d537cd10b6d1983ce63b66838b8 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/layer_14-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e3e1c2c80ebd96177f58084368ab1b9dba387794f18dcaf8edd2fbfe5e9c960 +size 113308931 diff --git a/4b284b84bc4seed2/global_step80108/layer_15-model_00-model_states.pt b/4b284b84bc4seed2/global_step80108/layer_15-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e5b1f38c23759380bfd19cdafaed4ecfc24842f --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/layer_15-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d86cadea6cdbc712ebffdd34a1afcb03c1423013c3f976b2e37bf06f0f5b7da +size 113308931 diff --git a/4b284b84bc4seed2/global_step80108/layer_15-model_01-model_states.pt b/4b284b84bc4seed2/global_step80108/layer_15-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f25e77172eb7f05edf87ec950cde242619e9953 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/layer_15-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f55634fd91e57a9fa82a0633ff680c42196344612e8ef18c62191756bba91616 +size 113308931 diff --git a/4b284b84bc4seed2/global_step80108/layer_16-model_00-model_states.pt b/4b284b84bc4seed2/global_step80108/layer_16-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c3e2f470c0651350b84bd4bd90f1c4572d649280 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/layer_16-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:039d483ef69598fd67c00d09de14b695306247a9e7746065ba0c119cfc31967b +size 113308931 diff --git a/4b284b84bc4seed2/global_step80108/layer_16-model_01-model_states.pt b/4b284b84bc4seed2/global_step80108/layer_16-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..985249b52742885275d1aa69d7f8327bc36f7d87 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/layer_16-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f752409852f2081414723bfde1a162cf5a432f14e8f2d46cfccf65b99789466 +size 113308931 diff --git a/4b284b84bc4seed2/global_step80108/layer_17-model_00-model_states.pt b/4b284b84bc4seed2/global_step80108/layer_17-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3d9c0eb69832e0bfa4118c565dcaf27b6bb1339d --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/layer_17-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c0977dd68afab3d75d8900513752d978298ecef73319ed648d28ff7ed8cd99b +size 113308931 diff --git a/4b284b84bc4seed2/global_step80108/layer_17-model_01-model_states.pt b/4b284b84bc4seed2/global_step80108/layer_17-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ceb2cdebad6ff2208a1a85b00764d26800e2927 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/layer_17-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:509555da1d4b2bbe3b686f67ab24a70eb96340f170aa7ad77cc5a3918d404a4d +size 113308931 diff --git a/4b284b84bc4seed2/global_step80108/layer_18-model_00-model_states.pt b/4b284b84bc4seed2/global_step80108/layer_18-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6bc05689c15b87fc79c975d9ea3c426cafdc3f49 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/layer_18-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6631f1d366129c935481ff32d5f15c586c0d927c4f0c49702e96ad8bccceca45 +size 113308931 diff --git a/4b284b84bc4seed2/global_step80108/layer_18-model_01-model_states.pt b/4b284b84bc4seed2/global_step80108/layer_18-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a253bc2f3c6609c3f94c1f3ad8468da91f37ea5 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/layer_18-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f68cf6fed8e29a78b9b78306683c78fd42afca8b60a6363b2de9123eee65c69 +size 113308931 diff --git a/4b284b84bc4seed2/global_step80108/layer_19-model_00-model_states.pt b/4b284b84bc4seed2/global_step80108/layer_19-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c536e294d747b1f93641ef147a9de3a3735e37f0 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/layer_19-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e35576e0d9345600617915d0f3641c0e5da76b37c0f0d780f43f8b24f79a8a10 +size 113308931 diff --git a/4b284b84bc4seed2/global_step80108/layer_19-model_01-model_states.pt b/4b284b84bc4seed2/global_step80108/layer_19-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8fef3df3674ec5b6af705dafa1c74e928a99dd5a --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/layer_19-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:698743267134c5d74ec8e310029d07d30c86157a8f66be52edad8882593128e3 +size 113308931 diff --git a/4b284b84bc4seed2/global_step80108/layer_20-model_00-model_states.pt b/4b284b84bc4seed2/global_step80108/layer_20-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3841318d60cd6c9c70ee658962b6f898a12b8303 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/layer_20-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96d0650f09921612c18a67dc1aa8290624daca2c4a81252fe5c45b675b0a6829 +size 113308931 diff --git a/4b284b84bc4seed2/global_step80108/layer_20-model_01-model_states.pt b/4b284b84bc4seed2/global_step80108/layer_20-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..77ae8727dabcdda602e4b43aac24078d9c772f2e --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/layer_20-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86ea67e48c6d00dcd4d0a551558c7f2ea9775df6a7a551547a58ca453110f082 +size 113308931 diff --git a/4b284b84bc4seed2/global_step80108/layer_21-model_00-model_states.pt b/4b284b84bc4seed2/global_step80108/layer_21-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..29bdfb5024ff26429fd6b3cd1359917ed0509ca0 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/layer_21-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30ec943ddeb0a7e11b4e9034ee7242b0c46d912d537598185866d6bbefde5727 +size 113308931 diff --git a/4b284b84bc4seed2/global_step80108/layer_21-model_01-model_states.pt b/4b284b84bc4seed2/global_step80108/layer_21-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9cc5feb7f7e505fa27840ee4994087380d159635 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/layer_21-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bce2e74d43ee5faeff78e5789e4da23aabc536294916f85e1127c998fd7024c5 +size 113308931 diff --git a/4b284b84bc4seed2/global_step80108/layer_22-model_00-model_states.pt b/4b284b84bc4seed2/global_step80108/layer_22-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..52188361cc89ab217640347d2dbeb7fcf9e51302 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/layer_22-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:368d97ccf7be35f8b8749ec45080064fadfc199c7e414cfad70af9191e5039a5 +size 113308931 diff --git a/4b284b84bc4seed2/global_step80108/layer_22-model_01-model_states.pt b/4b284b84bc4seed2/global_step80108/layer_22-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d1842b530d0cf3e62c33ba55c4a2f46ef399cea --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/layer_22-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4610f08bd2e1f8ac8aba83bb75aab387a98698092e712008a833979a1be3456f +size 113308931 diff --git a/4b284b84bc4seed2/global_step80108/layer_23-model_00-model_states.pt b/4b284b84bc4seed2/global_step80108/layer_23-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d727cfaed5c90152b088329a06187c82cef7e744 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/layer_23-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96da429a282a67e5a7b4852a4a33ae5b9d086f5ea35a81027a816c172e524f93 +size 113308931 diff --git a/4b284b84bc4seed2/global_step80108/layer_23-model_01-model_states.pt b/4b284b84bc4seed2/global_step80108/layer_23-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..480f4230ca103cdb171a2fd67b666ec00f6a1f8f --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/layer_23-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10401e9d0105438c5170c68d26e8f4c89c927f7d8a0300e01d0d475bc9c402eb +size 113308931 diff --git a/4b284b84bc4seed2/global_step80108/layer_24-model_00-model_states.pt b/4b284b84bc4seed2/global_step80108/layer_24-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd16687287ca30dd446895f52646a9a93ed210c5 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/layer_24-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7161eebcf08ee9976c27006fce40ccd40026dd1c04eeee565621738f87141a54 +size 113308931 diff --git a/4b284b84bc4seed2/global_step80108/layer_24-model_01-model_states.pt b/4b284b84bc4seed2/global_step80108/layer_24-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..af48390089e705ad6efcc6c302614beaa7a222b2 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/layer_24-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ceffbe7ec706ba482a4935e5b68b4ae0995c96033a759baec5333ab48c8c6e89 +size 113308931 diff --git a/4b284b84bc4seed2/global_step80108/layer_25-model_00-model_states.pt b/4b284b84bc4seed2/global_step80108/layer_25-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d2c5385b12d2225a7c2a3bd7f7233a437c9a90b4 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/layer_25-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c7a2c4ed92ed0119acc9c1a426c3d9244a17130d2fb1789b0c052dfe6e32eb9 +size 113308931 diff --git a/4b284b84bc4seed2/global_step80108/layer_25-model_01-model_states.pt b/4b284b84bc4seed2/global_step80108/layer_25-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..32e64fcafd577c5d9cddd2a200a06fd4881cbca2 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/layer_25-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20d5dbf1f92efac7ef919c16bb9d42176fc6e06a5def873b96b5e25679a5500f +size 113308931 diff --git a/4b284b84bc4seed2/global_step80108/layer_26-model_00-model_states.pt b/4b284b84bc4seed2/global_step80108/layer_26-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..349e7fe3fd699116e1d4355463a5acce790bce54 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/layer_26-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a9d1708e6571399f48f942a9b6e60a654ba5cfcd0145f61e157376cfed79953 +size 113308931 diff --git a/4b284b84bc4seed2/global_step80108/layer_26-model_01-model_states.pt b/4b284b84bc4seed2/global_step80108/layer_26-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a2c4dcad7513d596abe507560ae10708982800f --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/layer_26-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f874b276b00e4381bb018ba21817877df46231eb0af128af7f78454557999b19 +size 113308931 diff --git a/4b284b84bc4seed2/global_step80108/layer_27-model_00-model_states.pt b/4b284b84bc4seed2/global_step80108/layer_27-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eaa58a44f94d35d1902a6e21d8612443846b6bc0 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/layer_27-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6853b94a694c8678404a4a1d4a27aae54fc8cc1b7ab3dfb2062c9f475f9c857 +size 113308931 diff --git a/4b284b84bc4seed2/global_step80108/layer_27-model_01-model_states.pt b/4b284b84bc4seed2/global_step80108/layer_27-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..27ccabe2ec9fb2eaec190de3f21542cde354d469 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/layer_27-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49e95d2fb34fcc75ab1dc38959f678d1f43bc6694c66a94993740f445b3c9441 +size 113308931 diff --git a/4b284b84bc4seed2/global_step80108/layer_28-model_00-model_states.pt b/4b284b84bc4seed2/global_step80108/layer_28-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ea73358495a99024a39590bf76bc24ba99242f2 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/layer_28-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd50b1f239e3eaccee732eaa29563d17b98c65f95cbbb56d53cb471ee6a7d14a +size 113308931 diff --git a/4b284b84bc4seed2/global_step80108/layer_28-model_01-model_states.pt b/4b284b84bc4seed2/global_step80108/layer_28-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..283b31d2e9fe1ab4cf94746a76783618e90ffee6 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/layer_28-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef8cd075f8c64d5f34f92d5c2bfb3131f21ea997466e62afe599bf8b12ca35a8 +size 113308931 diff --git a/4b284b84bc4seed2/global_step80108/layer_29-model_00-model_states.pt b/4b284b84bc4seed2/global_step80108/layer_29-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b6f204be36df226436c66e27a27c7a58aefe68d --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/layer_29-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ffe30c8ec89a9b9c59788e759e6a5c8fb81ca4a2fa9cdd470c33f5bdb6f6a2d9 +size 113308931 diff --git a/4b284b84bc4seed2/global_step80108/layer_29-model_01-model_states.pt b/4b284b84bc4seed2/global_step80108/layer_29-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..97b418b55e9cf319283bf2b4a0e36b43720d1402 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/layer_29-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11d1b03c5a22186e28b7fe20a73e7df3c7e46e7ebc2519da3d0717256aa8652d +size 113308931 diff --git a/4b284b84bc4seed2/global_step80108/layer_30-model_00-model_states.pt b/4b284b84bc4seed2/global_step80108/layer_30-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..65134227147e6f9ebdeb7baa9b0361213266c4f5 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/layer_30-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82a96a52a0c65675f2a7be9f7c525aa134454e21893f961ca245be11f7dc9e4a +size 113308931 diff --git a/4b284b84bc4seed2/global_step80108/layer_30-model_01-model_states.pt b/4b284b84bc4seed2/global_step80108/layer_30-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ffdff9cbd957f98e39d459390bd3192782159a0 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/layer_30-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45fc0c3ea89938cffb3309e593055811653fdb9b2b1b7e58a3513bbcf736d014 +size 113308931 diff --git a/4b284b84bc4seed2/global_step80108/layer_31-model_00-model_states.pt b/4b284b84bc4seed2/global_step80108/layer_31-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eeebbd4a4a43ea0ac8fc0ac8a4e2f985e24c6d52 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/layer_31-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee5089d00c3787742877e8aca3b26c6bb0dd189b24ad5da9252554d46161a2a3 +size 113308931 diff --git a/4b284b84bc4seed2/global_step80108/layer_31-model_01-model_states.pt b/4b284b84bc4seed2/global_step80108/layer_31-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8c0791a78f044398b66a1d325198b43acec97c4f --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/layer_31-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06b560a5d39a09a5e8a3a6aa3efff623c1e34e07bb13c2909222a6b528140c48 +size 113308931 diff --git a/4b284b84bc4seed2/global_step80108/layer_32-model_00-model_states.pt b/4b284b84bc4seed2/global_step80108/layer_32-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b09dfe479f7d0e07eba50110e6fa005de389753b --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/layer_32-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f998cc9eba183ab26860d5e05dd90e57983cf9d0cee00d9bddd4945d6f52eef5 +size 113308931 diff --git a/4b284b84bc4seed2/global_step80108/layer_32-model_01-model_states.pt b/4b284b84bc4seed2/global_step80108/layer_32-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b7fccf393d5be92db5400690fd85487e89fafda3 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/layer_32-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:398b40d195b5c73e3164b7f93e84807a798e6b511ea0f83cd19bcfe38549988a +size 113308931 diff --git a/4b284b84bc4seed2/global_step80108/layer_33-model_00-model_states.pt b/4b284b84bc4seed2/global_step80108/layer_33-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e66168a6aa05e063c0ec2bd3bca1febb6b5192b --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/layer_33-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7db2dd020677a4d16bd3b6a2712c52860d655af0a3a6864ceaf00b91d09fb71f +size 113308931 diff --git a/4b284b84bc4seed2/global_step80108/layer_33-model_01-model_states.pt b/4b284b84bc4seed2/global_step80108/layer_33-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2cc360237792668f811b3ee36b164448408a2a3a --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/layer_33-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9e9b97804daab9d29195f19293fabb51f5aafb39307e572d9c459d4df2145d4 +size 113308931 diff --git a/4b284b84bc4seed2/global_step80108/layer_34-model_00-model_states.pt b/4b284b84bc4seed2/global_step80108/layer_34-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8fa4c835597b8fc6d82bde82e4c3513faf7018c7 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/layer_34-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6090acd50fd727033edbcd4e5cbdb0b7541308f39e7a40a4e81a31279d6b7511 +size 113308931 diff --git a/4b284b84bc4seed2/global_step80108/layer_34-model_01-model_states.pt b/4b284b84bc4seed2/global_step80108/layer_34-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3d075f01a585a8dc041f07a237b1a6a34779ff05 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/layer_34-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6626c3fab1c8a541caf459bb0acb0e4a16ed7fac765e5fd9457e31e1114047dc +size 113308931 diff --git a/4b284b84bc4seed2/global_step80108/layer_35-model_00-model_states.pt b/4b284b84bc4seed2/global_step80108/layer_35-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a6d0214695455463d15b02d2f14e642338705eac --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/layer_35-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ee41b4d6613f4f84b4fa4c873f5d4a1c30af517a461cd8e26f7e15fc02b4de5 +size 113308931 diff --git a/4b284b84bc4seed2/global_step80108/layer_35-model_01-model_states.pt b/4b284b84bc4seed2/global_step80108/layer_35-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a9e9db157f08539178ec9c768af6099b0be5051f --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/layer_35-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd4806e831dc41507c35e6cf3da69340b6b0b6af65e63cac226effd28cfad312 +size 113308931 diff --git a/4b284b84bc4seed2/global_step80108/layer_36-model_00-model_states.pt b/4b284b84bc4seed2/global_step80108/layer_36-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..74bd60b1b77a56c5d0c66e4ba9737e3e6dff3194 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/layer_36-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40013e276b2126e175e83bd058a98c37402423b655e5cbfce7eb95b4e3797104 +size 113308931 diff --git a/4b284b84bc4seed2/global_step80108/layer_36-model_01-model_states.pt b/4b284b84bc4seed2/global_step80108/layer_36-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6fe8ea87844b64382da6720fcf384d2e3d27a1cf --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/layer_36-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c91b2e29edf54789ae5249497f3864b275468290770792326eb26f0053ff63a8 +size 113308931 diff --git a/4b284b84bc4seed2/global_step80108/layer_37-model_00-model_states.pt b/4b284b84bc4seed2/global_step80108/layer_37-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..145cb0d7756da63270e1f04fda727562425d4c08 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/layer_37-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad2208bcdba291db1b828c3d1943759668c5ada86da64fb2cad2599a4c6348c4 +size 113308931 diff --git a/4b284b84bc4seed2/global_step80108/layer_37-model_01-model_states.pt b/4b284b84bc4seed2/global_step80108/layer_37-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..81459a6516ebbb9ef12b428cf362011872996b75 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/layer_37-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c4d23d9b400b4aa4b6dd29723875d1597cd85b25b1101386941cdd2c1f048d8 +size 113308931 diff --git a/4b284b84bc4seed2/global_step80108/layer_38-model_00-model_states.pt b/4b284b84bc4seed2/global_step80108/layer_38-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb6cce3e81eaed416d90264885ab6b9985ce1adf --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/layer_38-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:977fc18883848727c449375c3e9ffbcacf51776ee7aa13cce81a330fab872e2b +size 113308931 diff --git a/4b284b84bc4seed2/global_step80108/layer_38-model_01-model_states.pt b/4b284b84bc4seed2/global_step80108/layer_38-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..af3904a8f4f616b5079b18f3c50baf101ec27305 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/layer_38-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ce01f56a91dba76a45122abe3bc687c8714927762b512fdb8bf2864c599849b +size 113308931 diff --git a/4b284b84bc4seed2/global_step80108/layer_40-model_00-model_states.pt b/4b284b84bc4seed2/global_step80108/layer_40-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f9d524084c429ff7c552abcd05034d5d4b644edc --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/layer_40-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a75d5812ea4a81902f145f15195195d9019a3c0f090b5a68b1b5ba7f32aa03a3 +size 13507 diff --git a/4b284b84bc4seed2/global_step80108/layer_40-model_01-model_states.pt b/4b284b84bc4seed2/global_step80108/layer_40-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..07b576d9bdab5894bf166b2eca302f4f7631de4b --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/layer_40-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6042f47c6fee661ea0d84c4120878a598e4cb86aa3b998370779fd7239cbeceb +size 13507 diff --git a/4b284b84bc4seed2/global_step80108/mp_rank_00_model_states.pt b/4b284b84bc4seed2/global_step80108/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..32519c1c47b6110f7e650969a011e1991d72ff56 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e144ffaaf1cd400581af8f2a38d244b74da36289e5f0ea1e7f55d6182cf8bf8 +size 51443 diff --git a/4b284b84bc4seed2/global_step80108/mp_rank_01_model_states.pt b/4b284b84bc4seed2/global_step80108/mp_rank_01_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0d97e80808cb872fea03422456f3c248c9871600 --- /dev/null +++ b/4b284b84bc4seed2/global_step80108/mp_rank_01_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:79be9a086654387051928a802fa305f281cfec144aa67f480b8e457e5afd6786 +size 51443 diff --git a/4b284b84bc4seed2/transformers/config.json b/4b284b84bc4seed2/transformers/config.json new file mode 100644 index 0000000000000000000000000000000000000000..df814c3a71ee49044410636b5eeb4f43611690ba --- /dev/null +++ b/4b284b84bc4seed2/transformers/config.json @@ -0,0 +1 @@ +{"vocab_size": 50432, "n_positions": 2048, "n_embd": 3072, "n_layer": 36, "n_head": 24, "n_inner": 12288, "activation_function": "gelu", "resid_pdrop": 0.1, "embd_pdrop": 0.1, "attn_pdrop": 0.1, "layer_norm_epsilon": 1e-05, "initializer_range": 0.02, "summary_type": "cls_index", "summary_use_proj": true, "summary_activation": null, "summary_first_dropout": 0.1, "summary_proj_to_labels": true, "scale_attn_weights": true, "use_cache": true, "scale_attn_by_inverse_layer_idx": false, "reorder_and_upcast_attn": false, "bos_token_id": 50256, "eos_token_id": 50256, "return_dict": true, "output_hidden_states": false, "output_attentions": false, "torchscript": false, "torch_dtype": null, "use_bfloat16": false, "tf_legacy_loss": false, "pruned_heads": {}, "tie_word_embeddings": true, "is_encoder_decoder": false, "is_decoder": false, "cross_attention_hidden_size": null, "add_cross_attention": false, "tie_encoder_decoder": false, "max_length": 20, "min_length": 0, "do_sample": false, "early_stopping": false, "num_beams": 1, "num_beam_groups": 1, "diversity_penalty": 0.0, "temperature": 1.0, "top_k": 50, "top_p": 1.0, "typical_p": 1.0, "repetition_penalty": 1.0, "length_penalty": 1.0, "no_repeat_ngram_size": 0, "encoder_no_repeat_ngram_size": 0, "bad_words_ids": null, "num_return_sequences": 1, "chunk_size_feed_forward": 0, "output_scores": false, "return_dict_in_generate": false, "forced_bos_token_id": null, "forced_eos_token_id": null, "remove_invalid_values": false, "exponential_decay_length_penalty": null, "suppress_tokens": null, "begin_suppress_tokens": null, "architectures": ["GPT2LMHeadModel"], "finetuning_task": null, "id2label": {"0": "LABEL_0", "1": "LABEL_1"}, "label2id": {"LABEL_0": 0, "LABEL_1": 1}, "tokenizer_class": null, "prefix": null, "pad_token_id": null, "sep_token_id": null, "decoder_start_token_id": null, "task_specific_params": null, "problem_type": null, "_name_or_path": "", "transformers_version": "4.25.0.dev0", "n_ctx": 1024, "gradient_checkpointing": false, "model_type": "gpt2"} \ No newline at end of file diff --git a/4b284b84bc4seed2/transformers/pytorch_model.bin b/4b284b84bc4seed2/transformers/pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..d9670e4d7c30f71ad46dc7d78a8aa0958b9b4420 --- /dev/null +++ b/4b284b84bc4seed2/transformers/pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eead93c42b705f4b529065cdc9e56f76e9125e7306a609e078bb8468560dfea0 +size 8781203669 diff --git a/4b284b84bc4seed3/evaluation/generation/agg.4b284b84bc4seed3_GEM-web_nlg_en_PALM_prompt_0.json b/4b284b84bc4seed3/evaluation/generation/agg.4b284b84bc4seed3_GEM-web_nlg_en_PALM_prompt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..acbbe3fcdb835d98469dd500725893a527c143b4 --- /dev/null +++ b/4b284b84bc4seed3/evaluation/generation/agg.4b284b84bc4seed3_GEM-web_nlg_en_PALM_prompt_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.3778578966148067, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.043108338793946065}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07411555032972421, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.001538099367112622}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.309304518659125, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004647036349994307}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.11229918414347093, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002038339976908837}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.035405873343107096, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0009494477514351852}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.15177029561380864, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0032441764358631343}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.05373275688087374, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0012922653888554133}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.07128915442841278, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001421332991618732}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.3006366755077802, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004524046109868848}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.10836013211520433, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001907062297131903}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.07058874999622211, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0014347547189524324}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.2951817916558195, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004352927117156272}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.10699983162704317, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0018997512152092622}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed3/evaluation/generation/agg.4b284b84bc4seed3_GEM-web_nlg_en_PALM_prompt_1.json b/4b284b84bc4seed3/evaluation/generation/agg.4b284b84bc4seed3_GEM-web_nlg_en_PALM_prompt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..9e83dc74f668007a0a80e7fa3a524d92803c2105 --- /dev/null +++ b/4b284b84bc4seed3/evaluation/generation/agg.4b284b84bc4seed3_GEM-web_nlg_en_PALM_prompt_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.5559292194446633, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.033063305669521814}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07344134290778047, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0013075775283346684}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.38367122642556717, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005374779689077085}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.11519017450049537, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.001781459047903915}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03451957379808363, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0008237357497660324}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.1902878844491511, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0038667575429744347}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.05429955369368683, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001164101537291991}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.06953493691658816, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0012180136656132438}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.35915530916109556, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004866166233820879}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.1089395644753034, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001663152079550431}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.0700241015268691, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0012535074467763}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.36285521927513625, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004946296798374893}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.10966995207767154, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.001701230535057806}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed3/evaluation/generation/agg.4b284b84bc4seed3_GEM-web_nlg_en_PALM_prompt_2.json b/4b284b84bc4seed3/evaluation/generation/agg.4b284b84bc4seed3_GEM-web_nlg_en_PALM_prompt_2.json new file mode 100644 index 0000000000000000000000000000000000000000..e6220e4fc90ac2ded8a819e95df08283349771e2 --- /dev/null +++ b/4b284b84bc4seed3/evaluation/generation/agg.4b284b84bc4seed3_GEM-web_nlg_en_PALM_prompt_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.5782472127932445, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.02876860184072706}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07332998641209827, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0012278221285519305}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.4051352210429427, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005349246205768158}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.11608314556487608, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0016856934686361683}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.034072750089738806, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007661045363189041}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.20084233643875887, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003927573729716624}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.054101025197296336, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0010930137218225489}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.0682789164826936, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.00114056254383938}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.36994608434763104, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004671069819142146}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.10781733963253654, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0015624544135440744}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.06944433376851597, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0011635802718539946}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.3806199258716764, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004907310655807021}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.10978895909106065, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0015935691932955263}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed3/evaluation/generation/agg.4b284b84bc4seed3_GEM-web_nlg_en_PALM_prompt_3.json b/4b284b84bc4seed3/evaluation/generation/agg.4b284b84bc4seed3_GEM-web_nlg_en_PALM_prompt_3.json new file mode 100644 index 0000000000000000000000000000000000000000..7e5e3a5e01ba9c7c301f2f831b7eeb53ebed81f7 --- /dev/null +++ b/4b284b84bc4seed3/evaluation/generation/agg.4b284b84bc4seed3_GEM-web_nlg_en_PALM_prompt_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.6915008150808406, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.03546518672506001}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07432407498828138, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0012325917015022579}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.4104911461112403, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005343537670914898}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.11803876998559919, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0017025734287338006}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03485135568208787, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007550726857230097}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.20729890874003387, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003943582140548173}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.05560964185032228, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001085229952279771}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.06880425728281662, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0011244989363678815}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.375153241896145, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004712690263932408}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.10904814717011492, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0015470673139562688}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.07034752749731535, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0011699863791661837}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.3857816920367689, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004912882067435381}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.11156419888096808, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016120520944898505}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed3/evaluation/generation/agg.4b284b84bc4seed3_GEM-web_nlg_en_PALM_prompt_4.json b/4b284b84bc4seed3/evaluation/generation/agg.4b284b84bc4seed3_GEM-web_nlg_en_PALM_prompt_4.json new file mode 100644 index 0000000000000000000000000000000000000000..33a6b762dadb235ab603108cd401b059960ec720 --- /dev/null +++ b/4b284b84bc4seed3/evaluation/generation/agg.4b284b84bc4seed3_GEM-web_nlg_en_PALM_prompt_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.7189066936765581, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.037013333820727926}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.0746932073820224, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0012134517684081734}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.41771020616828414, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0052465481407677345}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.11905897645265517, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0016851385659147225}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.034925003471357664, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007449043245097383}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.21258956488991562, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003996053593134186}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.055971441098147307, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0010771389506484157}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.06837902016461192, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0010967825484641605}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.3778018545867543, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.00455156041833246}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.10871097099572738, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0015089792586892492}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.07063506078356421, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0011518223964322905}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.39341366411170076, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.00485926225127653}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.11244409077423552, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0015904992527627166}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed3/evaluation/generation/agg.4b284b84bc4seed3_GEM-web_nlg_en_PALM_prompt_5.json b/4b284b84bc4seed3/evaluation/generation/agg.4b284b84bc4seed3_GEM-web_nlg_en_PALM_prompt_5.json new file mode 100644 index 0000000000000000000000000000000000000000..2e05ece9759f6b22cbe0c7c58d789cff33fd4a47 --- /dev/null +++ b/4b284b84bc4seed3/evaluation/generation/agg.4b284b84bc4seed3_GEM-web_nlg_en_PALM_prompt_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.7868046756108051, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.02991271086752641}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07492512647076705, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0011666617641076609}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.4328553245785454, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005279295280429884}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.12018582936445632, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0016323788305252095}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03506321715356214, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007143804415237641}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.22123976259437653, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003995978607772992}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.05660828028959127, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0010400981467133133}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.06818310395402347, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0010562464898575118}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.38959556517516325, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004569300260461267}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.10906303355905887, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0014559180672523411}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.07090266049584355, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.001113352975885553}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.4063980496121481, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004844306040632001}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.11355384378827522, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.001550934113029576}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed3/evaluation/generation/agg.4b284b84bc4seed3_GEM-wiki_lingua_en_tldr_en_0.json b/4b284b84bc4seed3/evaluation/generation/agg.4b284b84bc4seed3_GEM-wiki_lingua_en_tldr_en_0.json new file mode 100644 index 0000000000000000000000000000000000000000..68549aee574e15fbbbbd49d4fff8666bb7cf32dc --- /dev/null +++ b/4b284b84bc4seed3/evaluation/generation/agg.4b284b84bc4seed3_GEM-wiki_lingua_en_tldr_en_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.15334539415738388, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0019222806905930796}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.26182170525230664, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0027125088120466567}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.1796629653377477, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0018831601953688906}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.031909006707834885, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007708990454599334}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.05633865948240556, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0014288226584569942}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.03752338599482476, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0008657026414927998}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.11977598793404674, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0013475259124603452}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.21260047811552407, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002226957170728599}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.14212961094234547, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0013510429063892365}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.13994434092556626, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0017396047429116305}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.24051441991616382, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002515699207499435}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.16422175879907844, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.001702104333489601}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 1.6474987427065775, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.06593859959084909}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed3/evaluation/generation/agg.4b284b84bc4seed3_GEM-wiki_lingua_en_tldr_en_1.json b/4b284b84bc4seed3/evaluation/generation/agg.4b284b84bc4seed3_GEM-wiki_lingua_en_tldr_en_1.json new file mode 100644 index 0000000000000000000000000000000000000000..83cb73010e4027c9938135d0d8afc6028b3f245c --- /dev/null +++ b/4b284b84bc4seed3/evaluation/generation/agg.4b284b84bc4seed3_GEM-wiki_lingua_en_tldr_en_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.19811750483825502, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002244284359015066}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.3233361530990366, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0027615810059661346}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.22429676008256744, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0019215432949986416}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.04984071088538675, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0011306753133130294}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.08194485459001105, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.001676052028304491}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.055270992861272274, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0010209237932340483}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.13956446970769343, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001568888728809687}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.23527321502693888, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002186112073171261}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.15889068091572497, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0012757988630829789}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.18632650105602275, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.002136419893250326}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.30435788657049767, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002623892289765707}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.21089500684394413, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.001812341485185825}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 2.786152224873671, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.05808815291287487}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed3/evaluation/generation/agg.4b284b84bc4seed3_GEM-wiki_lingua_en_tldr_en_2.json b/4b284b84bc4seed3/evaluation/generation/agg.4b284b84bc4seed3_GEM-wiki_lingua_en_tldr_en_2.json new file mode 100644 index 0000000000000000000000000000000000000000..897b29dc8e08307772e6420db1c6536612818365 --- /dev/null +++ b/4b284b84bc4seed3/evaluation/generation/agg.4b284b84bc4seed3_GEM-wiki_lingua_en_tldr_en_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.21033059542814828, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002442858582337002}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.32413547755906186, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0028003239001999137}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.22937813566648368, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0019219764317323842}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.05523685617830656, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0012874559073350383}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.08462329830096554, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0017673558504113702}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.058712455420886434, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0010940197542857381}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.1497674533077381, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0018524531908293406}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.23560418818517648, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0022704842678573766}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.16297597705988986, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0013304409687103912}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.19887451626852745, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.002331309192885264}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.3069248020961403, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0026805984377935225}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.21693278589564352, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0018227504624372965}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 3.230998083062549, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.050797557201713334}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed3/evaluation/generation/agg.4b284b84bc4seed3_GEM-wiki_lingua_en_tldr_en_3.json b/4b284b84bc4seed3/evaluation/generation/agg.4b284b84bc4seed3_GEM-wiki_lingua_en_tldr_en_3.json new file mode 100644 index 0000000000000000000000000000000000000000..78991a1f8a522d2dfa24d3aca21dd6dd764150bb --- /dev/null +++ b/4b284b84bc4seed3/evaluation/generation/agg.4b284b84bc4seed3_GEM-wiki_lingua_en_tldr_en_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.1806956214983726, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0027831512016435046}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.2623447416585146, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0033680997374848517}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.1876832021711141, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0022940658612174095}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.047673762536966334, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0013822773824892138}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.0697044253840176, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.001729633370079589}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.04841722766281516, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0011008037910137322}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.13209227506220064, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002157083339054086}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.193574388819157, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0026303701953405384}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.13587871163748794, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0016337548444324763}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.1711795821823165, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.002664487441078435}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.24863617061757418, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0032228879303417934}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.17759916274930226, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0021766669356267855}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 3.2098001105373206, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.09099300025969562}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed3/evaluation/generation/agg.4b284b84bc4seed3_GEM-wiki_lingua_en_tldr_en_4.json b/4b284b84bc4seed3/evaluation/generation/agg.4b284b84bc4seed3_GEM-wiki_lingua_en_tldr_en_4.json new file mode 100644 index 0000000000000000000000000000000000000000..7440e17d4ae6ae7d9bdce8228a334fe9f318d086 --- /dev/null +++ b/4b284b84bc4seed3/evaluation/generation/agg.4b284b84bc4seed3_GEM-wiki_lingua_en_tldr_en_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.05880934489289142, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0022689626423463057}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.08575740200155547, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002995322533624644}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.05909725046757388, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0020201095521583104}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.015110877443934299, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.000991369440072553}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.022701528371762265, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.001245597630024608}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.014955192433241102, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0007610692004221399}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.04469761272469577, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0018115322606699102}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.06493843037748623, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0023175889760991357}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.044050934610035515, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001498662498119108}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.0553855629257085, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0021577985213379713}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.08067508006348567, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0028298079410380454}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.055485095239080344, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0018978766900965142}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 0.6098983821550592, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.057390083475920894}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed3/evaluation/generation/agg.4b284b84bc4seed3_GEM-wiki_lingua_en_tldr_en_5.json b/4b284b84bc4seed3/evaluation/generation/agg.4b284b84bc4seed3_GEM-wiki_lingua_en_tldr_en_5.json new file mode 100644 index 0000000000000000000000000000000000000000..39075a41793c0d42600c378f8bf3487f3f42f3d2 --- /dev/null +++ b/4b284b84bc4seed3/evaluation/generation/agg.4b284b84bc4seed3_GEM-wiki_lingua_en_tldr_en_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.009364139423338884, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0010022987284321672}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.014018983768781176, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0013739169170373748}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.009438215462949508, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0008930219445271543}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.002554638785654485, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0004139088387696996}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.004058440910233081, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0006059287974265584}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.002492491138928612, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.00033796870035768413}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.007004878000531978, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0007704906553010422}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.010728122020319702, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0010948722482846322}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.007008419627805089, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0006680187288932387}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.008716167882302485, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0009417371430749615}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.013083621795425198, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0012869514383126801}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.008755675533348816, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0008272404703615799}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 7.585034963472076e-07, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 1.5369928370922445e-06}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed3/evaluation/generation/agg.4b284b84bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_0.json b/4b284b84bc4seed3/evaluation/generation/agg.4b284b84bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..b1edfa9766fceb7ae788fbe0353a32e701ab3b62 --- /dev/null +++ b/4b284b84bc4seed3/evaluation/generation/agg.4b284b84bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 2.302445011589307, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.06211023865546385}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.12233139227806873, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0010629452092601635}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.25742079610936297, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.001800775093152571}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.16312944483849517, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0012810447257741884}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.030911049123290638, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007417529238496929}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.06285991268008932, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0015091563495189734}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.04090223997307209, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0009736983422614277}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.12118590550392237, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0010248820684599837}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.2555207273914006, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.001760350193080484}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.16171573051604754, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0012389880599311676}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.09601857609439678, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0009739557630404562}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.20198211758201637, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0017356209782491401}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.1280356806160262, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0012028446220128677}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed3/evaluation/generation/agg.4b284b84bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_1.json b/4b284b84bc4seed3/evaluation/generation/agg.4b284b84bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_1.json new file mode 100644 index 0000000000000000000000000000000000000000..c68ee1d31dd829137d82c02a8261636b6de70443 --- /dev/null +++ b/4b284b84bc4seed3/evaluation/generation/agg.4b284b84bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 9.263924206317883, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.07741695657438914}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.46181278849346963, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.003686608618192092}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4286623121704012, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.003005228287502819}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.4034314142097248, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0022118879808028843}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.2127064486018551, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0026018988957500753}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.19238207615248135, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.00208794348752037}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.18184691082787147, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0018176157547358858}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.3491570035267105, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.003076016478420658}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3262548928750604, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002559992101041393}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.3047130282688444, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0018640708877106472}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.3805884982861303, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0034128765580002424}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.35050122813254053, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0027309493870352275}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.33103396853758926, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002167584950514449}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed3/evaluation/generation/agg.4b284b84bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_2.json b/4b284b84bc4seed3/evaluation/generation/agg.4b284b84bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_2.json new file mode 100644 index 0000000000000000000000000000000000000000..1381b00384cacecfdd31297bde1f0cff2eb6a217 --- /dev/null +++ b/4b284b84bc4seed3/evaluation/generation/agg.4b284b84bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 10.065169479277689, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.13743485776863448}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.4521349721323409, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0037077133304098463}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4576969276598449, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002912059970191956}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.41741556545511066, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0022731192955223276}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.2175791657307876, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0026523412395747367}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.21609856115013357, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002192652821722558}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.19704389881949605, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0018909764984676675}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.34696313010753177, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0030525069814565397}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3551058458123904, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.00253577560262687}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.32096479784507037, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0018970324444313584}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.3795245084348248, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003449429352786332}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3815645358661485, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002712452534885871}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.349200751229774, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0022493473991314562}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed3/evaluation/generation/agg.4b284b84bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_3.json b/4b284b84bc4seed3/evaluation/generation/agg.4b284b84bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_3.json new file mode 100644 index 0000000000000000000000000000000000000000..81181c71898e86d86959a0d467101f4df6c42e98 --- /dev/null +++ b/4b284b84bc4seed3/evaluation/generation/agg.4b284b84bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 11.409501258883944, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.200735926048327}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.47359150110281645, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0035801720410154575}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.46852198178337934, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0028471977217635184}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.4385722344979268, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0023100736158786}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.23359678515529092, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0026715948188736267}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.22730491424875773, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002252917174717242}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.21297415730718317, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.002002023485009685}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.36122582263536407, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0030394944731669572}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.35939795651767675, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002511542644538787}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.33437569173005427, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0020107174748746504}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.3998844531789924, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0033854020792017285}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3938246920292058, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002729767161367992}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.36932279359236814, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0023179469576599027}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed3/evaluation/generation/agg.4b284b84bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_4.json b/4b284b84bc4seed3/evaluation/generation/agg.4b284b84bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_4.json new file mode 100644 index 0000000000000000000000000000000000000000..96d0e3d9c9c4909908316a6a85b0e8d080eeb6dd --- /dev/null +++ b/4b284b84bc4seed3/evaluation/generation/agg.4b284b84bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 12.452122590183434, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.16404160542943327}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.49497236517824444, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0035535658412753006}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4725995896409827, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0028157186492877196}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.45315190664308314, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002278710461652685}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.24812095038732754, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0027737064203339212}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.2324345352491202, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002259923232212951}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.22316519517459477, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0020371724840063865}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.3745330183490656, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0030718020025572107}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3585821251012964, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0024911676803155646}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.34240410488312567, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0020393007899216064}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.4179948014646539, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0033899691757338438}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3979598039322067, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0027471446794053813}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.38201002954999475, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002335148377240596}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed3/evaluation/generation/agg.4b284b84bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_5.json b/4b284b84bc4seed3/evaluation/generation/agg.4b284b84bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_5.json new file mode 100644 index 0000000000000000000000000000000000000000..bc48c0e50fc5f237f4a2b8eb2421dacb1eb2af00 --- /dev/null +++ b/4b284b84bc4seed3/evaluation/generation/agg.4b284b84bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 13.309002924662785, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.24361495936574476}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.5055114743909561, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0034029405989093315}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.47439394771123267, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0027085795597238727}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.46337099933680953, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0022284128767927217}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.2543085325831986, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0026833318688377957}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.23498034253109115, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0022102671857103136}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.22971317638516242, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0020276942034306005}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.38203696819305627, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0029643784309907667}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.35829625222003997, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002388395524420644}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.3493044245188954, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0020072603771810445}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.4307656306766157, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003270545893660294}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.4032599450584402, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0026395356242984963}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.39422575829822615, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0022790324609071426}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed3/evaluation/generation/agg.4b284b84bc4seed3_gem_xsum_article_DOC_summary_0.json b/4b284b84bc4seed3/evaluation/generation/agg.4b284b84bc4seed3_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..3293346e3d8beea2d6717c6a4d308036ba565466 --- /dev/null +++ b/4b284b84bc4seed3/evaluation/generation/agg.4b284b84bc4seed3_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.15448121328596862, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.001977188397188564}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.35997124440611034, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004298205436694583}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.2118853569842521, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0024831762617585746}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.03645241402160218, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0011752236536019232}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.08865405071591761, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0029077149755190814}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.05056562034464029, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001595549541223809}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.11766298156431257, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.00154525669786904}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.27589374122183485, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0034812956688468695}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.161553829612935, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0019356026144079317}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.12262950144266513, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0016994024464092056}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.28822399594677356, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.003908951289350794}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.1685758842303753, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002177154066590156}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 2.061265150562031, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.1047194903989246}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed3/evaluation/generation/agg.4b284b84bc4seed3_gem_xsum_article_DOC_summary_1.json b/4b284b84bc4seed3/evaluation/generation/agg.4b284b84bc4seed3_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..ade11be66fcf84a5700963c563724c785f0f8ba7 --- /dev/null +++ b/4b284b84bc4seed3/evaluation/generation/agg.4b284b84bc4seed3_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.12615666366329323, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0019462075646106281}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.3075463314111142, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004435681902516454}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.17677552083071896, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0026150769110123255}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.025631403863087567, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0010195570539420784}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.0643057936335091, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0025821054535310178}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.036209551359239395, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001431805409098863}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.09789606233860006, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0014408570567453658}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.2409666745294604, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0034493105763191037}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.1375227449624894, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0019568848326575864}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.09901294724556717, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0015797250447342009}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.24365682374976821, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0037520223325616334}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.13906823791458356, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002145977759148375}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.4701047191488112, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.052325655561989}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed3/evaluation/generation/agg.4b284b84bc4seed3_gem_xsum_article_DOC_summary_2.json b/4b284b84bc4seed3/evaluation/generation/agg.4b284b84bc4seed3_gem_xsum_article_DOC_summary_2.json new file mode 100644 index 0000000000000000000000000000000000000000..2afbef3164959669577ecbe9bfc4daa4dda24394 --- /dev/null +++ b/4b284b84bc4seed3/evaluation/generation/agg.4b284b84bc4seed3_gem_xsum_article_DOC_summary_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.12819697138408215, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.001923900850974331}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.3131959520911201, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004483015545746866}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.17977482443218196, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0025982011983283434}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.02774216419058187, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0010191913758900069}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.07049404002692027, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002708125093624563}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.03935463682151496, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001450577987245735}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.10245043926274368, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0014451803861143982}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.251818647068035, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.003494519863990314}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.14388467760513854, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0019644343349970836}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.09951049154417256, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0015455068687096165}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.24565320812202304, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0037974977466490017}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.13992101774839874, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002118355649079576}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.4983004480453936, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.08614156872925424}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed3/evaluation/generation/agg.4b284b84bc4seed3_gem_xsum_article_DOC_summary_3.json b/4b284b84bc4seed3/evaluation/generation/agg.4b284b84bc4seed3_gem_xsum_article_DOC_summary_3.json new file mode 100644 index 0000000000000000000000000000000000000000..c26e364c54e1a626195f791258e069447258c2fa --- /dev/null +++ b/4b284b84bc4seed3/evaluation/generation/agg.4b284b84bc4seed3_gem_xsum_article_DOC_summary_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.12507167063309826, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0020654668780499437}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.29352230739872903, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0046129265452261245}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.1716640710662149, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002692661486106222}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.0273731792590075, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.001058152769608845}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.06719512443269011, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002640278987747084}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.0383031309264901, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001471824908387901}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.10247899612143699, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0016344209712852228}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.24201656560824256, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0037826395255217203}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.1409323879677072, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.00215402254496125}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.09654487009443463, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0016852992800909113}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.2286055088707561, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.003922038940141684}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.13277160506058835, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002226502076197834}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.5436814601886297, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.10599321563006747}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed3/evaluation/generation/agg.4b284b84bc4seed3_gem_xsum_article_DOC_summary_4.json b/4b284b84bc4seed3/evaluation/generation/agg.4b284b84bc4seed3_gem_xsum_article_DOC_summary_4.json new file mode 100644 index 0000000000000000000000000000000000000000..f664f8e7dff697be3ba18c4bc2c0ad59d743bb89 --- /dev/null +++ b/4b284b84bc4seed3/evaluation/generation/agg.4b284b84bc4seed3_gem_xsum_article_DOC_summary_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.0429708507344084, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0028037413845202774}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.07465376472309838, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004321865151720348}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.04863969374523076, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002793420771992738}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.010519316602496626, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.001355747591263505}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.017499542584772765, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0015490170099444409}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.011395576090619692, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0010345794788431668}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.0356382053447805, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002395385288173853}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.060770117722936286, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0034770592750759917}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.039590536804712924, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0022228567744426667}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.035133893923727386, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0024011989607887903}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.059405756146875044, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.003457018339558158}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.0387553178144167, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0022066400343704485}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 0.7915506170854982, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.13278546480806505}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed3/evaluation/generation/agg.4b284b84bc4seed3_gem_xsum_article_DOC_summary_5.json b/4b284b84bc4seed3/evaluation/generation/agg.4b284b84bc4seed3_gem_xsum_article_DOC_summary_5.json new file mode 100644 index 0000000000000000000000000000000000000000..ebd132499b0f794ecbc9221dd44a218ab193e583 --- /dev/null +++ b/4b284b84bc4seed3/evaluation/generation/agg.4b284b84bc4seed3_gem_xsum_article_DOC_summary_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.0028705257493446055, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0008218246257449791}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.0023902360458122112, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.000665569783756533}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.002544363512676877, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0007109896306856554}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.00031292391170304596, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.00016477755162714296}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.0002616879975370542, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.00014932256088281653}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.0002809498461785326, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.00015434551667733464}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.0021053678911906607, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0005892152083882312}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.0017230940880273344, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0004664097240871752}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.0018550844925242101, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0005069733094142548}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.002095488296127936, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.00060247869960542}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.001758329007481808, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0005034233459254993}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.001872065671306264, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0005341865975835362}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 7.197738308121429e-37, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 1.5261190640932973e-32}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_GEM-web_nlg_en_PALM_prompt_0.jsonl b/4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_GEM-web_nlg_en_PALM_prompt_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..4006bfeb3d67aa0233ed938afc47326bece4a82d --- /dev/null +++ b/4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_GEM-web_nlg_en_PALM_prompt_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4301696e0a244fe1ec7eff3ddba464a1754f2eaf49409092f7d6a7795610c7e3 +size 4109836 diff --git a/4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_GEM-web_nlg_en_PALM_prompt_1.jsonl b/4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_GEM-web_nlg_en_PALM_prompt_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..0e708e0051fe838772065f2301159c433114123e --- /dev/null +++ b/4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_GEM-web_nlg_en_PALM_prompt_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc6e0df55e53537f0dfad3b800c7968931bc455b55ba9fe7b10e43c1946d4aff +size 5155130 diff --git a/4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_GEM-web_nlg_en_PALM_prompt_2.jsonl b/4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_GEM-web_nlg_en_PALM_prompt_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e8e9407011a4080a91a9be67caca29458656dc1b --- /dev/null +++ b/4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_GEM-web_nlg_en_PALM_prompt_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea5562722bb3eaade9843f978a12b9cabfcbfae190c89fe6016e5a2d65e44678 +size 6083861 diff --git a/4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_GEM-web_nlg_en_PALM_prompt_3.jsonl b/4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_GEM-web_nlg_en_PALM_prompt_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..0fb26fe59931a1e0a876823f8e0f961ba932e826 --- /dev/null +++ b/4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_GEM-web_nlg_en_PALM_prompt_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c78e6e0a92ecfa1ece1d7bab6bace7f9cf14fccb5f7a7ccb11e23532af27a30c +size 6986348 diff --git a/4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_GEM-web_nlg_en_PALM_prompt_4.jsonl b/4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_GEM-web_nlg_en_PALM_prompt_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..838f5ddef79032fa8703eecd50a516e468102f29 --- /dev/null +++ b/4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_GEM-web_nlg_en_PALM_prompt_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b55c088651789b0eeda84d840a9fcd4e8e06bcc43977207a804643fa51b50db8 +size 7893808 diff --git a/4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_GEM-web_nlg_en_PALM_prompt_5.jsonl b/4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_GEM-web_nlg_en_PALM_prompt_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..1cbdd219e75044959ec858f51d5a0c9fcd2732a3 --- /dev/null +++ b/4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_GEM-web_nlg_en_PALM_prompt_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b5856440be3628f065858ee107c7f9d3a77f259ce4eca70c8444080c430fd82 +size 8821667 diff --git a/4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_GEM-wiki_lingua_en_tldr_en_0.jsonl b/4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_GEM-wiki_lingua_en_tldr_en_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..4ba8e0b550f3c1dfb7a92f3b505f986fc1863e1f --- /dev/null +++ b/4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_GEM-wiki_lingua_en_tldr_en_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a5b17537ae8edceb8e3ec1d9026a7270bd24dc4d9298dcf91679c64ea37951d +size 7691336 diff --git a/4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_GEM-wiki_lingua_en_tldr_en_1.jsonl b/4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_GEM-wiki_lingua_en_tldr_en_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..2b4417f059925b159ff18abb77589ecdbac63a94 --- /dev/null +++ b/4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_GEM-wiki_lingua_en_tldr_en_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cef513fc272bec490cb07e87a10bf0941eb0f0e4de8c4639112f3304d4e0cad0 +size 13311457 diff --git a/4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_GEM-wiki_lingua_en_tldr_en_2.jsonl b/4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_GEM-wiki_lingua_en_tldr_en_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..5c738a305a993bff9bd92be7c54e6c0c9082f65d --- /dev/null +++ b/4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_GEM-wiki_lingua_en_tldr_en_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9133f653d010e334954b8075d14248715d80110f1e88d242255d45a07b15716 +size 18892556 diff --git a/4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_GEM-wiki_lingua_en_tldr_en_3.jsonl b/4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_GEM-wiki_lingua_en_tldr_en_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..5569cbb725b222cc836a18da3320a07e817ece95 --- /dev/null +++ b/4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_GEM-wiki_lingua_en_tldr_en_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30412262d6c1498eea0b2bcb811d812e3279d2e298ea9ca874332bde45131ef8 +size 24303396 diff --git a/4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_GEM-wiki_lingua_en_tldr_en_4.jsonl b/4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_GEM-wiki_lingua_en_tldr_en_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..4080e6787e57089ac31077875168eec79b5da8f2 --- /dev/null +++ b/4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_GEM-wiki_lingua_en_tldr_en_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b75907621956d9c04046ba010fd6c38b1012496ee14fd7454e8b7a36e3188f0a +size 29463282 diff --git a/4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_GEM-wiki_lingua_en_tldr_en_5.jsonl b/4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_GEM-wiki_lingua_en_tldr_en_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..b08215dc85c729403b75eaf81b8b4c2f65e61262 --- /dev/null +++ b/4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_GEM-wiki_lingua_en_tldr_en_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee2ea3552d8b49e6f4adb2d523d0308d0c7380e0481e1011d51da591500769d1 +size 34799022 diff --git a/4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl b/4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..5f78ca8f8a3a32cdd3d4bbcb1f5d3e8e20b82508 --- /dev/null +++ b/4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cadcececfaeb508c8a6ccaef1673554b5cf4c3ba2a82dc38de7794dc277440d9 +size 4528803 diff --git a/4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl b/4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..89041b06b2887e2663ad7bb444345957efcbc7b4 --- /dev/null +++ b/4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b9a310bc74a171421712ea61c7b2eafd8f330c431c1412ca983090836c76e36 +size 5150151 diff --git a/4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl b/4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..f5822a6aee0b0a44403ed1286a0a4be84c4dd0c1 --- /dev/null +++ b/4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51b786bab0bf37e9fd4f51e33649fc5168ed5e65041cea42ae3756d8b0479aca +size 6269954 diff --git a/4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl b/4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..a1671211ccaee4bbeb84bd063dc715420ba2c0dc --- /dev/null +++ b/4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a91085009f3d9cc6d894929364aaef09ef5bc935e44a59f6bf4df49fbd6990f0 +size 7324567 diff --git a/4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl b/4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..f4939c4388675f21fb10f29f43eac0df0f8532a5 --- /dev/null +++ b/4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f45f79fec402c1d5a1439b1b812386da95a205b3e7cc1e97520983dc3c167d9f +size 8374428 diff --git a/4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl b/4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..a40487e426c151effae682acca3d82cb00d92ab9 --- /dev/null +++ b/4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f61fbbadc64b8221d36a3aa58a10cef6c0cf1bc70b55ab00a19cf257bbe51701 +size 9439924 diff --git a/4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_gem_xsum_article_DOC_summary_0.jsonl b/4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_gem_xsum_article_DOC_summary_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..b5f1993773e9ea9b234d5304ee9cb175f185bc1a --- /dev/null +++ b/4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_gem_xsum_article_DOC_summary_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55a6a77ba7997a0609d5e43ada9e6f74111f871354c44211e8750ecc8ed826a0 +size 2828924 diff --git a/4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_gem_xsum_article_DOC_summary_1.jsonl b/4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_gem_xsum_article_DOC_summary_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..13a95b23c3fff3a564e3c728e08a517382dbadb1 --- /dev/null +++ b/4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_gem_xsum_article_DOC_summary_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eafa2ee449328f29bb817eafeb827aef47e8d51a0961be041d39026306cf3ec9 +size 5107953 diff --git a/4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_gem_xsum_article_DOC_summary_2.jsonl b/4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_gem_xsum_article_DOC_summary_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..f5260cda48eb517cb6e714c58b10748a2dd38b48 --- /dev/null +++ b/4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_gem_xsum_article_DOC_summary_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7409ea02f6fe205306f4cf43c414084ce5dbf20f689a5a0a734bff55d35f4cef +size 7381954 diff --git a/4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_gem_xsum_article_DOC_summary_3.jsonl b/4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_gem_xsum_article_DOC_summary_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..ecc117c443d8c2d12697b36938064b913be2fe48 --- /dev/null +++ b/4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_gem_xsum_article_DOC_summary_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f5afd80646bef170b9eda55acaf34dff75c171a9d7a14aa48254aa8135920b1 +size 9649194 diff --git a/4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_gem_xsum_article_DOC_summary_4.jsonl b/4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_gem_xsum_article_DOC_summary_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..d62c64069fb382b287f0c658d3178f1b15d3a1f7 --- /dev/null +++ b/4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_gem_xsum_article_DOC_summary_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e40b310fea9e7a56606001b12c3a9bc58752430118cb224f5743f84b3eeb89a3 +size 11672875 diff --git a/4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_gem_xsum_article_DOC_summary_5.jsonl b/4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_gem_xsum_article_DOC_summary_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..ff44ef3632ac575c464653cdcbf14897f15af2dc --- /dev/null +++ b/4b284b84bc4seed3/evaluation/generation/examples.4b284b84bc4seed3_gem_xsum_article_DOC_summary_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4729f43413b3e6bd1b8f2facd0ffd873f04b5e8ca1fb420ba1ff4c9618e1d3a6 +size 13897528 diff --git a/4b284b84bc4seed3/evaluation/generation/merged.csv b/4b284b84bc4seed3/evaluation/generation/merged.csv new file mode 100644 index 0000000000000000000000000000000000000000..e31ab34c726d6b587d56a833d84dc2ae48ebf259 --- /dev/null +++ b/4b284b84bc4seed3/evaluation/generation/merged.csv @@ -0,0 +1,53 @@ +dataset,fewshots,prompt,metric,value +e2e_nlg_cleaned,0,generate_text_restaurant,rouge2_fmeasure,0.04090223997307209 +e2e_nlg_cleaned,0,median,rouge2_fmeasure,0.04090223997307209 +e2e_nlg_cleaned,1,generate_text_restaurant,rouge2_fmeasure,0.18184691082787147 +e2e_nlg_cleaned,1,median,rouge2_fmeasure,0.18184691082787147 +e2e_nlg_cleaned,2,generate_text_restaurant,rouge2_fmeasure,0.19704389881949605 +e2e_nlg_cleaned,2,median,rouge2_fmeasure,0.19704389881949605 +e2e_nlg_cleaned,3,generate_text_restaurant,rouge2_fmeasure,0.21297415730718317 +e2e_nlg_cleaned,3,median,rouge2_fmeasure,0.21297415730718317 +e2e_nlg_cleaned,4,generate_text_restaurant,rouge2_fmeasure,0.22316519517459477 +e2e_nlg_cleaned,4,median,rouge2_fmeasure,0.22316519517459477 +e2e_nlg_cleaned,5,generate_text_restaurant,rouge2_fmeasure,0.22971317638516242 +e2e_nlg_cleaned,5,median,rouge2_fmeasure,0.22971317638516242 +e2e_nlg_cleaned,5,average,multiple,0.18094092974789666 +gem_xsum,0,article_DOC_summary,rouge2_fmeasure,0.05056562034464029 +gem_xsum,0,median,rouge2_fmeasure,0.05056562034464029 +gem_xsum,1,article_DOC_summary,rouge2_fmeasure,0.036209551359239395 +gem_xsum,1,median,rouge2_fmeasure,0.036209551359239395 +gem_xsum,2,article_DOC_summary,rouge2_fmeasure,0.03935463682151496 +gem_xsum,2,median,rouge2_fmeasure,0.03935463682151496 +gem_xsum,3,article_DOC_summary,rouge2_fmeasure,0.0383031309264901 +gem_xsum,3,median,rouge2_fmeasure,0.0383031309264901 +gem_xsum,4,article_DOC_summary,rouge2_fmeasure,0.011395576090619692 +gem_xsum,4,median,rouge2_fmeasure,0.011395576090619692 +gem_xsum,5,article_DOC_summary,rouge2_fmeasure,0.0002809498461785326 +gem_xsum,5,median,rouge2_fmeasure,0.0002809498461785326 +gem_xsum,5,average,multiple,0.029351577564780493 +web_nlg_en,0,PALM_prompt,rouge2_fmeasure,0.05373275688087374 +web_nlg_en,0,median,rouge2_fmeasure,0.05373275688087374 +web_nlg_en,1,PALM_prompt,rouge2_fmeasure,0.05429955369368683 +web_nlg_en,1,median,rouge2_fmeasure,0.05429955369368683 +web_nlg_en,2,PALM_prompt,rouge2_fmeasure,0.054101025197296336 +web_nlg_en,2,median,rouge2_fmeasure,0.054101025197296336 +web_nlg_en,3,PALM_prompt,rouge2_fmeasure,0.05560964185032228 +web_nlg_en,3,median,rouge2_fmeasure,0.05560964185032228 +web_nlg_en,4,PALM_prompt,rouge2_fmeasure,0.055971441098147307 +web_nlg_en,4,median,rouge2_fmeasure,0.055971441098147307 +web_nlg_en,5,PALM_prompt,rouge2_fmeasure,0.05660828028959127 +web_nlg_en,5,median,rouge2_fmeasure,0.05660828028959127 +web_nlg_en,5,average,multiple,0.05505378316831963 +wiki_lingua_en,0,tldr_en,rouge2_fmeasure,0.03752338599482476 +wiki_lingua_en,0,median,rouge2_fmeasure,0.03752338599482476 +wiki_lingua_en,1,tldr_en,rouge2_fmeasure,0.055270992861272274 +wiki_lingua_en,1,median,rouge2_fmeasure,0.055270992861272274 +wiki_lingua_en,2,tldr_en,rouge2_fmeasure,0.058712455420886434 +wiki_lingua_en,2,median,rouge2_fmeasure,0.058712455420886434 +wiki_lingua_en,3,tldr_en,rouge2_fmeasure,0.04841722766281516 +wiki_lingua_en,3,median,rouge2_fmeasure,0.04841722766281516 +wiki_lingua_en,4,tldr_en,rouge2_fmeasure,0.014955192433241102 +wiki_lingua_en,4,median,rouge2_fmeasure,0.014955192433241102 +wiki_lingua_en,5,tldr_en,rouge2_fmeasure,0.002492491138928612 +wiki_lingua_en,5,median,rouge2_fmeasure,0.002492491138928612 +wiki_lingua_en,5,average,multiple,0.036228624251994725 diff --git a/4b284b84bc4seed3/evaluation/generation/merged.json b/4b284b84bc4seed3/evaluation/generation/merged.json new file mode 100644 index 0000000000000000000000000000000000000000..1b68dd614e52a74e89373181744870e529f7c86c --- /dev/null +++ b/4b284b84bc4seed3/evaluation/generation/merged.json @@ -0,0 +1 @@ +{"GEM/web_nlg_en": {"0": {"PALM_prompt": {"bleu": 0.3778578966148067, "bleu_stderr": 0.043108338793946065, "rouge1_fmeasure": 0.11229918414347093, "rouge1_fmeasure_stderr": 0.002038339976908837, "rouge1_precision": 0.07411555032972421, "rouge1_precision_stderr": 0.001538099367112622, "rouge1_recall": 0.309304518659125, "rouge1_recall_stderr": 0.004647036349994307, "rouge2_fmeasure": 0.05373275688087374, "rouge2_fmeasure_stderr": 0.0012922653888554133, "rouge2_precision": 0.035405873343107096, "rouge2_precision_stderr": 0.0009494477514351852, "rouge2_recall": 0.15177029561380864, "rouge2_recall_stderr": 0.0032441764358631343, "rougeL_fmeasure": 0.10836013211520433, "rougeL_fmeasure_stderr": 0.001907062297131903, "rougeL_precision": 0.07128915442841278, "rougeL_precision_stderr": 0.001421332991618732, "rougeL_recall": 0.3006366755077802, "rougeL_recall_stderr": 0.004524046109868848, "rougeLsum_fmeasure": 0.10699983162704317, "rougeLsum_fmeasure_stderr": 0.0018997512152092622, "rougeLsum_precision": 0.07058874999622211, "rougeLsum_precision_stderr": 0.0014347547189524324, "rougeLsum_recall": 0.2951817916558195, "rougeLsum_recall_stderr": 0.004352927117156272}}, "1": {"PALM_prompt": {"bleu": 0.5559292194446633, "bleu_stderr": 0.033063305669521814, "rouge1_fmeasure": 0.11519017450049537, "rouge1_fmeasure_stderr": 0.001781459047903915, "rouge1_precision": 0.07344134290778047, "rouge1_precision_stderr": 0.0013075775283346684, "rouge1_recall": 0.38367122642556717, "rouge1_recall_stderr": 0.005374779689077085, "rouge2_fmeasure": 0.05429955369368683, "rouge2_fmeasure_stderr": 0.001164101537291991, "rouge2_precision": 0.03451957379808363, "rouge2_precision_stderr": 0.0008237357497660324, "rouge2_recall": 0.1902878844491511, "rouge2_recall_stderr": 0.0038667575429744347, "rougeL_fmeasure": 0.1089395644753034, "rougeL_fmeasure_stderr": 0.001663152079550431, "rougeL_precision": 0.06953493691658816, "rougeL_precision_stderr": 0.0012180136656132438, "rougeL_recall": 0.35915530916109556, "rougeL_recall_stderr": 0.004866166233820879, "rougeLsum_fmeasure": 0.10966995207767154, "rougeLsum_fmeasure_stderr": 0.001701230535057806, "rougeLsum_precision": 0.0700241015268691, "rougeLsum_precision_stderr": 0.0012535074467763, "rougeLsum_recall": 0.36285521927513625, "rougeLsum_recall_stderr": 0.004946296798374893}}, "2": {"PALM_prompt": {"bleu": 0.5782472127932445, "bleu_stderr": 0.02876860184072706, "rouge1_fmeasure": 0.11608314556487608, "rouge1_fmeasure_stderr": 0.0016856934686361683, "rouge1_precision": 0.07332998641209827, "rouge1_precision_stderr": 0.0012278221285519305, "rouge1_recall": 0.4051352210429427, "rouge1_recall_stderr": 0.005349246205768158, "rouge2_fmeasure": 0.054101025197296336, "rouge2_fmeasure_stderr": 0.0010930137218225489, "rouge2_precision": 0.034072750089738806, "rouge2_precision_stderr": 0.0007661045363189041, "rouge2_recall": 0.20084233643875887, "rouge2_recall_stderr": 0.003927573729716624, "rougeL_fmeasure": 0.10781733963253654, "rougeL_fmeasure_stderr": 0.0015624544135440744, "rougeL_precision": 0.0682789164826936, "rougeL_precision_stderr": 0.00114056254383938, "rougeL_recall": 0.36994608434763104, "rougeL_recall_stderr": 0.004671069819142146, "rougeLsum_fmeasure": 0.10978895909106065, "rougeLsum_fmeasure_stderr": 0.0015935691932955263, "rougeLsum_precision": 0.06944433376851597, "rougeLsum_precision_stderr": 0.0011635802718539946, "rougeLsum_recall": 0.3806199258716764, "rougeLsum_recall_stderr": 0.004907310655807021}}, "3": {"PALM_prompt": {"bleu": 0.6915008150808406, "bleu_stderr": 0.03546518672506001, "rouge1_fmeasure": 0.11803876998559919, "rouge1_fmeasure_stderr": 0.0017025734287338006, "rouge1_precision": 0.07432407498828138, "rouge1_precision_stderr": 0.0012325917015022579, "rouge1_recall": 0.4104911461112403, "rouge1_recall_stderr": 0.005343537670914898, "rouge2_fmeasure": 0.05560964185032228, "rouge2_fmeasure_stderr": 0.001085229952279771, "rouge2_precision": 0.03485135568208787, "rouge2_precision_stderr": 0.0007550726857230097, "rouge2_recall": 0.20729890874003387, "rouge2_recall_stderr": 0.003943582140548173, "rougeL_fmeasure": 0.10904814717011492, "rougeL_fmeasure_stderr": 0.0015470673139562688, "rougeL_precision": 0.06880425728281662, "rougeL_precision_stderr": 0.0011244989363678815, "rougeL_recall": 0.375153241896145, "rougeL_recall_stderr": 0.004712690263932408, "rougeLsum_fmeasure": 0.11156419888096808, "rougeLsum_fmeasure_stderr": 0.0016120520944898505, "rougeLsum_precision": 0.07034752749731535, "rougeLsum_precision_stderr": 0.0011699863791661837, "rougeLsum_recall": 0.3857816920367689, "rougeLsum_recall_stderr": 0.004912882067435381}}, "4": {"PALM_prompt": {"bleu": 0.7189066936765581, "bleu_stderr": 0.037013333820727926, "rouge1_fmeasure": 0.11905897645265517, "rouge1_fmeasure_stderr": 0.0016851385659147225, "rouge1_precision": 0.0746932073820224, "rouge1_precision_stderr": 0.0012134517684081734, "rouge1_recall": 0.41771020616828414, "rouge1_recall_stderr": 0.0052465481407677345, "rouge2_fmeasure": 0.055971441098147307, "rouge2_fmeasure_stderr": 0.0010771389506484157, "rouge2_precision": 0.034925003471357664, "rouge2_precision_stderr": 0.0007449043245097383, "rouge2_recall": 0.21258956488991562, "rouge2_recall_stderr": 0.003996053593134186, "rougeL_fmeasure": 0.10871097099572738, "rougeL_fmeasure_stderr": 0.0015089792586892492, "rougeL_precision": 0.06837902016461192, "rougeL_precision_stderr": 0.0010967825484641605, "rougeL_recall": 0.3778018545867543, "rougeL_recall_stderr": 0.00455156041833246, "rougeLsum_fmeasure": 0.11244409077423552, "rougeLsum_fmeasure_stderr": 0.0015904992527627166, "rougeLsum_precision": 0.07063506078356421, "rougeLsum_precision_stderr": 0.0011518223964322905, "rougeLsum_recall": 0.39341366411170076, "rougeLsum_recall_stderr": 0.00485926225127653}}, "5": {"PALM_prompt": {"bleu": 0.7868046756108051, "bleu_stderr": 0.02991271086752641, "rouge1_fmeasure": 0.12018582936445632, "rouge1_fmeasure_stderr": 0.0016323788305252095, "rouge1_precision": 0.07492512647076705, "rouge1_precision_stderr": 0.0011666617641076609, "rouge1_recall": 0.4328553245785454, "rouge1_recall_stderr": 0.005279295280429884, "rouge2_fmeasure": 0.05660828028959127, "rouge2_fmeasure_stderr": 0.0010400981467133133, "rouge2_precision": 0.03506321715356214, "rouge2_precision_stderr": 0.0007143804415237641, "rouge2_recall": 0.22123976259437653, "rouge2_recall_stderr": 0.003995978607772992, "rougeL_fmeasure": 0.10906303355905887, "rougeL_fmeasure_stderr": 0.0014559180672523411, "rougeL_precision": 0.06818310395402347, "rougeL_precision_stderr": 0.0010562464898575118, "rougeL_recall": 0.38959556517516325, "rougeL_recall_stderr": 0.004569300260461267, "rougeLsum_fmeasure": 0.11355384378827522, "rougeLsum_fmeasure_stderr": 0.001550934113029576, "rougeLsum_precision": 0.07090266049584355, "rougeLsum_precision_stderr": 0.001113352975885553, "rougeLsum_recall": 0.4063980496121481, "rougeLsum_recall_stderr": 0.004844306040632001}}}, "GEM/wiki_lingua_en": {"0": {"tldr_en": {"bleu": 1.6474987427065775, "bleu_stderr": 0.06593859959084909, "rouge1_fmeasure": 0.1796629653377477, "rouge1_fmeasure_stderr": 0.0018831601953688906, "rouge1_precision": 0.15334539415738388, "rouge1_precision_stderr": 0.0019222806905930796, "rouge1_recall": 0.26182170525230664, "rouge1_recall_stderr": 0.0027125088120466567, "rouge2_fmeasure": 0.03752338599482476, "rouge2_fmeasure_stderr": 0.0008657026414927998, "rouge2_precision": 0.031909006707834885, "rouge2_precision_stderr": 0.0007708990454599334, "rouge2_recall": 0.05633865948240556, "rouge2_recall_stderr": 0.0014288226584569942, "rougeL_fmeasure": 0.14212961094234547, "rougeL_fmeasure_stderr": 0.0013510429063892365, "rougeL_precision": 0.11977598793404674, "rougeL_precision_stderr": 0.0013475259124603452, "rougeL_recall": 0.21260047811552407, "rougeL_recall_stderr": 0.002226957170728599, "rougeLsum_fmeasure": 0.16422175879907844, "rougeLsum_fmeasure_stderr": 0.001702104333489601, "rougeLsum_precision": 0.13994434092556626, "rougeLsum_precision_stderr": 0.0017396047429116305, "rougeLsum_recall": 0.24051441991616382, "rougeLsum_recall_stderr": 0.002515699207499435}}, "1": {"tldr_en": {"bleu": 2.786152224873671, "bleu_stderr": 0.05808815291287487, "rouge1_fmeasure": 0.22429676008256744, "rouge1_fmeasure_stderr": 0.0019215432949986416, "rouge1_precision": 0.19811750483825502, "rouge1_precision_stderr": 0.002244284359015066, "rouge1_recall": 0.3233361530990366, "rouge1_recall_stderr": 0.0027615810059661346, "rouge2_fmeasure": 0.055270992861272274, "rouge2_fmeasure_stderr": 0.0010209237932340483, "rouge2_precision": 0.04984071088538675, "rouge2_precision_stderr": 0.0011306753133130294, "rouge2_recall": 0.08194485459001105, "rouge2_recall_stderr": 0.001676052028304491, "rougeL_fmeasure": 0.15889068091572497, "rougeL_fmeasure_stderr": 0.0012757988630829789, "rougeL_precision": 0.13956446970769343, "rougeL_precision_stderr": 0.001568888728809687, "rougeL_recall": 0.23527321502693888, "rougeL_recall_stderr": 0.002186112073171261, "rougeLsum_fmeasure": 0.21089500684394413, "rougeLsum_fmeasure_stderr": 0.001812341485185825, "rougeLsum_precision": 0.18632650105602275, "rougeLsum_precision_stderr": 0.002136419893250326, "rougeLsum_recall": 0.30435788657049767, "rougeLsum_recall_stderr": 0.002623892289765707}}, "2": {"tldr_en": {"bleu": 3.230998083062549, "bleu_stderr": 0.050797557201713334, "rouge1_fmeasure": 0.22937813566648368, "rouge1_fmeasure_stderr": 0.0019219764317323842, "rouge1_precision": 0.21033059542814828, "rouge1_precision_stderr": 0.002442858582337002, "rouge1_recall": 0.32413547755906186, "rouge1_recall_stderr": 0.0028003239001999137, "rouge2_fmeasure": 0.058712455420886434, "rouge2_fmeasure_stderr": 0.0010940197542857381, "rouge2_precision": 0.05523685617830656, "rouge2_precision_stderr": 0.0012874559073350383, "rouge2_recall": 0.08462329830096554, "rouge2_recall_stderr": 0.0017673558504113702, "rougeL_fmeasure": 0.16297597705988986, "rougeL_fmeasure_stderr": 0.0013304409687103912, "rougeL_precision": 0.1497674533077381, "rougeL_precision_stderr": 0.0018524531908293406, "rougeL_recall": 0.23560418818517648, "rougeL_recall_stderr": 0.0022704842678573766, "rougeLsum_fmeasure": 0.21693278589564352, "rougeLsum_fmeasure_stderr": 0.0018227504624372965, "rougeLsum_precision": 0.19887451626852745, "rougeLsum_precision_stderr": 0.002331309192885264, "rougeLsum_recall": 0.3069248020961403, "rougeLsum_recall_stderr": 0.0026805984377935225}}, "3": {"tldr_en": {"bleu": 3.2098001105373206, "bleu_stderr": 0.09099300025969562, "rouge1_fmeasure": 0.1876832021711141, "rouge1_fmeasure_stderr": 0.0022940658612174095, "rouge1_precision": 0.1806956214983726, "rouge1_precision_stderr": 0.0027831512016435046, "rouge1_recall": 0.2623447416585146, "rouge1_recall_stderr": 0.0033680997374848517, "rouge2_fmeasure": 0.04841722766281516, "rouge2_fmeasure_stderr": 0.0011008037910137322, "rouge2_precision": 0.047673762536966334, "rouge2_precision_stderr": 0.0013822773824892138, "rouge2_recall": 0.0697044253840176, "rouge2_recall_stderr": 0.001729633370079589, "rougeL_fmeasure": 0.13587871163748794, "rougeL_fmeasure_stderr": 0.0016337548444324763, "rougeL_precision": 0.13209227506220064, "rougeL_precision_stderr": 0.002157083339054086, "rougeL_recall": 0.193574388819157, "rougeL_recall_stderr": 0.0026303701953405384, "rougeLsum_fmeasure": 0.17759916274930226, "rougeLsum_fmeasure_stderr": 0.0021766669356267855, "rougeLsum_precision": 0.1711795821823165, "rougeLsum_precision_stderr": 0.002664487441078435, "rougeLsum_recall": 0.24863617061757418, "rougeLsum_recall_stderr": 0.0032228879303417934}}, "4": {"tldr_en": {"bleu": 0.6098983821550592, "bleu_stderr": 0.057390083475920894, "rouge1_fmeasure": 0.05909725046757388, "rouge1_fmeasure_stderr": 0.0020201095521583104, "rouge1_precision": 0.05880934489289142, "rouge1_precision_stderr": 0.0022689626423463057, "rouge1_recall": 0.08575740200155547, "rouge1_recall_stderr": 0.002995322533624644, "rouge2_fmeasure": 0.014955192433241102, "rouge2_fmeasure_stderr": 0.0007610692004221399, "rouge2_precision": 0.015110877443934299, "rouge2_precision_stderr": 0.000991369440072553, "rouge2_recall": 0.022701528371762265, "rouge2_recall_stderr": 0.001245597630024608, "rougeL_fmeasure": 0.044050934610035515, "rougeL_fmeasure_stderr": 0.001498662498119108, "rougeL_precision": 0.04469761272469577, "rougeL_precision_stderr": 0.0018115322606699102, "rougeL_recall": 0.06493843037748623, "rougeL_recall_stderr": 0.0023175889760991357, "rougeLsum_fmeasure": 0.055485095239080344, "rougeLsum_fmeasure_stderr": 0.0018978766900965142, "rougeLsum_precision": 0.0553855629257085, "rougeLsum_precision_stderr": 0.0021577985213379713, "rougeLsum_recall": 0.08067508006348567, "rougeLsum_recall_stderr": 0.0028298079410380454}}, "5": {"tldr_en": {"bleu": 7.585034963472076e-07, "bleu_stderr": 1.5369928370922445e-06, "rouge1_fmeasure": 0.009438215462949508, "rouge1_fmeasure_stderr": 0.0008930219445271543, "rouge1_precision": 0.009364139423338884, "rouge1_precision_stderr": 0.0010022987284321672, "rouge1_recall": 0.014018983768781176, "rouge1_recall_stderr": 0.0013739169170373748, "rouge2_fmeasure": 0.002492491138928612, "rouge2_fmeasure_stderr": 0.00033796870035768413, "rouge2_precision": 0.002554638785654485, "rouge2_precision_stderr": 0.0004139088387696996, "rouge2_recall": 0.004058440910233081, "rouge2_recall_stderr": 0.0006059287974265584, "rougeL_fmeasure": 0.007008419627805089, "rougeL_fmeasure_stderr": 0.0006680187288932387, "rougeL_precision": 0.007004878000531978, "rougeL_precision_stderr": 0.0007704906553010422, "rougeL_recall": 0.010728122020319702, "rougeL_recall_stderr": 0.0010948722482846322, "rougeLsum_fmeasure": 0.008755675533348816, "rougeLsum_fmeasure_stderr": 0.0008272404703615799, "rougeLsum_precision": 0.008716167882302485, "rougeLsum_precision_stderr": 0.0009417371430749615, "rougeLsum_recall": 0.013083621795425198, "rougeLsum_recall_stderr": 0.0012869514383126801}}}, "e2e_nlg_cleaned": {"0": {"generate_text_restaurant": {"bleu": 2.302445011589307, "bleu_stderr": 0.06211023865546385, "rouge1_fmeasure": 0.16312944483849517, "rouge1_fmeasure_stderr": 0.0012810447257741884, "rouge1_precision": 0.12233139227806873, "rouge1_precision_stderr": 0.0010629452092601635, "rouge1_recall": 0.25742079610936297, "rouge1_recall_stderr": 0.001800775093152571, "rouge2_fmeasure": 0.04090223997307209, "rouge2_fmeasure_stderr": 0.0009736983422614277, "rouge2_precision": 0.030911049123290638, "rouge2_precision_stderr": 0.0007417529238496929, "rouge2_recall": 0.06285991268008932, "rouge2_recall_stderr": 0.0015091563495189734, "rougeL_fmeasure": 0.16171573051604754, "rougeL_fmeasure_stderr": 0.0012389880599311676, "rougeL_precision": 0.12118590550392237, "rougeL_precision_stderr": 0.0010248820684599837, "rougeL_recall": 0.2555207273914006, "rougeL_recall_stderr": 0.001760350193080484, "rougeLsum_fmeasure": 0.1280356806160262, "rougeLsum_fmeasure_stderr": 0.0012028446220128677, "rougeLsum_precision": 0.09601857609439678, "rougeLsum_precision_stderr": 0.0009739557630404562, "rougeLsum_recall": 0.20198211758201637, "rougeLsum_recall_stderr": 0.0017356209782491401}}, "1": {"generate_text_restaurant": {"bleu": 9.263924206317883, "bleu_stderr": 0.07741695657438914, "rouge1_fmeasure": 0.4034314142097248, "rouge1_fmeasure_stderr": 0.0022118879808028843, "rouge1_precision": 0.46181278849346963, "rouge1_precision_stderr": 0.003686608618192092, "rouge1_recall": 0.4286623121704012, "rouge1_recall_stderr": 0.003005228287502819, "rouge2_fmeasure": 0.18184691082787147, "rouge2_fmeasure_stderr": 0.0018176157547358858, "rouge2_precision": 0.2127064486018551, "rouge2_precision_stderr": 0.0026018988957500753, "rouge2_recall": 0.19238207615248135, "rouge2_recall_stderr": 0.00208794348752037, "rougeL_fmeasure": 0.3047130282688444, "rougeL_fmeasure_stderr": 0.0018640708877106472, "rougeL_precision": 0.3491570035267105, "rougeL_precision_stderr": 0.003076016478420658, "rougeL_recall": 0.3262548928750604, "rougeL_recall_stderr": 0.002559992101041393, "rougeLsum_fmeasure": 0.33103396853758926, "rougeLsum_fmeasure_stderr": 0.002167584950514449, "rougeLsum_precision": 0.3805884982861303, "rougeLsum_precision_stderr": 0.0034128765580002424, "rougeLsum_recall": 0.35050122813254053, "rougeLsum_recall_stderr": 0.0027309493870352275}}, "2": {"generate_text_restaurant": {"bleu": 10.065169479277689, "bleu_stderr": 0.13743485776863448, "rouge1_fmeasure": 0.41741556545511066, "rouge1_fmeasure_stderr": 0.0022731192955223276, "rouge1_precision": 0.4521349721323409, "rouge1_precision_stderr": 0.0037077133304098463, "rouge1_recall": 0.4576969276598449, "rouge1_recall_stderr": 0.002912059970191956, "rouge2_fmeasure": 0.19704389881949605, "rouge2_fmeasure_stderr": 0.0018909764984676675, "rouge2_precision": 0.2175791657307876, "rouge2_precision_stderr": 0.0026523412395747367, "rouge2_recall": 0.21609856115013357, "rouge2_recall_stderr": 0.002192652821722558, "rougeL_fmeasure": 0.32096479784507037, "rougeL_fmeasure_stderr": 0.0018970324444313584, "rougeL_precision": 0.34696313010753177, "rougeL_precision_stderr": 0.0030525069814565397, "rougeL_recall": 0.3551058458123904, "rougeL_recall_stderr": 0.00253577560262687, "rougeLsum_fmeasure": 0.349200751229774, "rougeLsum_fmeasure_stderr": 0.0022493473991314562, "rougeLsum_precision": 0.3795245084348248, "rougeLsum_precision_stderr": 0.003449429352786332, "rougeLsum_recall": 0.3815645358661485, "rougeLsum_recall_stderr": 0.002712452534885871}}, "3": {"generate_text_restaurant": {"bleu": 11.409501258883944, "bleu_stderr": 0.200735926048327, "rouge1_fmeasure": 0.4385722344979268, "rouge1_fmeasure_stderr": 0.0023100736158786, "rouge1_precision": 0.47359150110281645, "rouge1_precision_stderr": 0.0035801720410154575, "rouge1_recall": 0.46852198178337934, "rouge1_recall_stderr": 0.0028471977217635184, "rouge2_fmeasure": 0.21297415730718317, "rouge2_fmeasure_stderr": 0.002002023485009685, "rouge2_precision": 0.23359678515529092, "rouge2_precision_stderr": 0.0026715948188736267, "rouge2_recall": 0.22730491424875773, "rouge2_recall_stderr": 0.002252917174717242, "rougeL_fmeasure": 0.33437569173005427, "rougeL_fmeasure_stderr": 0.0020107174748746504, "rougeL_precision": 0.36122582263536407, "rougeL_precision_stderr": 0.0030394944731669572, "rougeL_recall": 0.35939795651767675, "rougeL_recall_stderr": 0.002511542644538787, "rougeLsum_fmeasure": 0.36932279359236814, "rougeLsum_fmeasure_stderr": 0.0023179469576599027, "rougeLsum_precision": 0.3998844531789924, "rougeLsum_precision_stderr": 0.0033854020792017285, "rougeLsum_recall": 0.3938246920292058, "rougeLsum_recall_stderr": 0.002729767161367992}}, "4": {"generate_text_restaurant": {"bleu": 12.452122590183434, "bleu_stderr": 0.16404160542943327, "rouge1_fmeasure": 0.45315190664308314, "rouge1_fmeasure_stderr": 0.002278710461652685, "rouge1_precision": 0.49497236517824444, "rouge1_precision_stderr": 0.0035535658412753006, "rouge1_recall": 0.4725995896409827, "rouge1_recall_stderr": 0.0028157186492877196, "rouge2_fmeasure": 0.22316519517459477, "rouge2_fmeasure_stderr": 0.0020371724840063865, "rouge2_precision": 0.24812095038732754, "rouge2_precision_stderr": 0.0027737064203339212, "rouge2_recall": 0.2324345352491202, "rouge2_recall_stderr": 0.002259923232212951, "rougeL_fmeasure": 0.34240410488312567, "rougeL_fmeasure_stderr": 0.0020393007899216064, "rougeL_precision": 0.3745330183490656, "rougeL_precision_stderr": 0.0030718020025572107, "rougeL_recall": 0.3585821251012964, "rougeL_recall_stderr": 0.0024911676803155646, "rougeLsum_fmeasure": 0.38201002954999475, "rougeLsum_fmeasure_stderr": 0.002335148377240596, "rougeLsum_precision": 0.4179948014646539, "rougeLsum_precision_stderr": 0.0033899691757338438, "rougeLsum_recall": 0.3979598039322067, "rougeLsum_recall_stderr": 0.0027471446794053813}}, "5": {"generate_text_restaurant": {"bleu": 13.309002924662785, "bleu_stderr": 0.24361495936574476, "rouge1_fmeasure": 0.46337099933680953, "rouge1_fmeasure_stderr": 0.0022284128767927217, "rouge1_precision": 0.5055114743909561, "rouge1_precision_stderr": 0.0034029405989093315, "rouge1_recall": 0.47439394771123267, "rouge1_recall_stderr": 0.0027085795597238727, "rouge2_fmeasure": 0.22971317638516242, "rouge2_fmeasure_stderr": 0.0020276942034306005, "rouge2_precision": 0.2543085325831986, "rouge2_precision_stderr": 0.0026833318688377957, "rouge2_recall": 0.23498034253109115, "rouge2_recall_stderr": 0.0022102671857103136, "rougeL_fmeasure": 0.3493044245188954, "rougeL_fmeasure_stderr": 0.0020072603771810445, "rougeL_precision": 0.38203696819305627, "rougeL_precision_stderr": 0.0029643784309907667, "rougeL_recall": 0.35829625222003997, "rougeL_recall_stderr": 0.002388395524420644, "rougeLsum_fmeasure": 0.39422575829822615, "rougeLsum_fmeasure_stderr": 0.0022790324609071426, "rougeLsum_precision": 0.4307656306766157, "rougeLsum_precision_stderr": 0.003270545893660294, "rougeLsum_recall": 0.4032599450584402, "rougeLsum_recall_stderr": 0.0026395356242984963}}}, "gem_xsum": {"0": {"article_DOC_summary": {"bleu": 2.061265150562031, "bleu_stderr": 0.1047194903989246, "rouge1_fmeasure": 0.2118853569842521, "rouge1_fmeasure_stderr": 0.0024831762617585746, "rouge1_precision": 0.15448121328596862, "rouge1_precision_stderr": 0.001977188397188564, "rouge1_recall": 0.35997124440611034, "rouge1_recall_stderr": 0.004298205436694583, "rouge2_fmeasure": 0.05056562034464029, "rouge2_fmeasure_stderr": 0.001595549541223809, "rouge2_precision": 0.03645241402160218, "rouge2_precision_stderr": 0.0011752236536019232, "rouge2_recall": 0.08865405071591761, "rouge2_recall_stderr": 0.0029077149755190814, "rougeL_fmeasure": 0.161553829612935, "rougeL_fmeasure_stderr": 0.0019356026144079317, "rougeL_precision": 0.11766298156431257, "rougeL_precision_stderr": 0.00154525669786904, "rougeL_recall": 0.27589374122183485, "rougeL_recall_stderr": 0.0034812956688468695, "rougeLsum_fmeasure": 0.1685758842303753, "rougeLsum_fmeasure_stderr": 0.002177154066590156, "rougeLsum_precision": 0.12262950144266513, "rougeLsum_precision_stderr": 0.0016994024464092056, "rougeLsum_recall": 0.28822399594677356, "rougeLsum_recall_stderr": 0.003908951289350794}}, "1": {"article_DOC_summary": {"bleu": 1.4701047191488112, "bleu_stderr": 0.052325655561989, "rouge1_fmeasure": 0.17677552083071896, "rouge1_fmeasure_stderr": 0.0026150769110123255, "rouge1_precision": 0.12615666366329323, "rouge1_precision_stderr": 0.0019462075646106281, "rouge1_recall": 0.3075463314111142, "rouge1_recall_stderr": 0.004435681902516454, "rouge2_fmeasure": 0.036209551359239395, "rouge2_fmeasure_stderr": 0.001431805409098863, "rouge2_precision": 0.025631403863087567, "rouge2_precision_stderr": 0.0010195570539420784, "rouge2_recall": 0.0643057936335091, "rouge2_recall_stderr": 0.0025821054535310178, "rougeL_fmeasure": 0.1375227449624894, "rougeL_fmeasure_stderr": 0.0019568848326575864, "rougeL_precision": 0.09789606233860006, "rougeL_precision_stderr": 0.0014408570567453658, "rougeL_recall": 0.2409666745294604, "rougeL_recall_stderr": 0.0034493105763191037, "rougeLsum_fmeasure": 0.13906823791458356, "rougeLsum_fmeasure_stderr": 0.002145977759148375, "rougeLsum_precision": 0.09901294724556717, "rougeLsum_precision_stderr": 0.0015797250447342009, "rougeLsum_recall": 0.24365682374976821, "rougeLsum_recall_stderr": 0.0037520223325616334}}, "2": {"article_DOC_summary": {"bleu": 1.4983004480453936, "bleu_stderr": 0.08614156872925424, "rouge1_fmeasure": 0.17977482443218196, "rouge1_fmeasure_stderr": 0.0025982011983283434, "rouge1_precision": 0.12819697138408215, "rouge1_precision_stderr": 0.001923900850974331, "rouge1_recall": 0.3131959520911201, "rouge1_recall_stderr": 0.004483015545746866, "rouge2_fmeasure": 0.03935463682151496, "rouge2_fmeasure_stderr": 0.001450577987245735, "rouge2_precision": 0.02774216419058187, "rouge2_precision_stderr": 0.0010191913758900069, "rouge2_recall": 0.07049404002692027, "rouge2_recall_stderr": 0.002708125093624563, "rougeL_fmeasure": 0.14388467760513854, "rougeL_fmeasure_stderr": 0.0019644343349970836, "rougeL_precision": 0.10245043926274368, "rougeL_precision_stderr": 0.0014451803861143982, "rougeL_recall": 0.251818647068035, "rougeL_recall_stderr": 0.003494519863990314, "rougeLsum_fmeasure": 0.13992101774839874, "rougeLsum_fmeasure_stderr": 0.002118355649079576, "rougeLsum_precision": 0.09951049154417256, "rougeLsum_precision_stderr": 0.0015455068687096165, "rougeLsum_recall": 0.24565320812202304, "rougeLsum_recall_stderr": 0.0037974977466490017}}, "3": {"article_DOC_summary": {"bleu": 1.5436814601886297, "bleu_stderr": 0.10599321563006747, "rouge1_fmeasure": 0.1716640710662149, "rouge1_fmeasure_stderr": 0.002692661486106222, "rouge1_precision": 0.12507167063309826, "rouge1_precision_stderr": 0.0020654668780499437, "rouge1_recall": 0.29352230739872903, "rouge1_recall_stderr": 0.0046129265452261245, "rouge2_fmeasure": 0.0383031309264901, "rouge2_fmeasure_stderr": 0.001471824908387901, "rouge2_precision": 0.0273731792590075, "rouge2_precision_stderr": 0.001058152769608845, "rouge2_recall": 0.06719512443269011, "rouge2_recall_stderr": 0.002640278987747084, "rougeL_fmeasure": 0.1409323879677072, "rougeL_fmeasure_stderr": 0.00215402254496125, "rougeL_precision": 0.10247899612143699, "rougeL_precision_stderr": 0.0016344209712852228, "rougeL_recall": 0.24201656560824256, "rougeL_recall_stderr": 0.0037826395255217203, "rougeLsum_fmeasure": 0.13277160506058835, "rougeLsum_fmeasure_stderr": 0.002226502076197834, "rougeLsum_precision": 0.09654487009443463, "rougeLsum_precision_stderr": 0.0016852992800909113, "rougeLsum_recall": 0.2286055088707561, "rougeLsum_recall_stderr": 0.003922038940141684}}, "4": {"article_DOC_summary": {"bleu": 0.7915506170854982, "bleu_stderr": 0.13278546480806505, "rouge1_fmeasure": 0.04863969374523076, "rouge1_fmeasure_stderr": 0.002793420771992738, "rouge1_precision": 0.0429708507344084, "rouge1_precision_stderr": 0.0028037413845202774, "rouge1_recall": 0.07465376472309838, "rouge1_recall_stderr": 0.004321865151720348, "rouge2_fmeasure": 0.011395576090619692, "rouge2_fmeasure_stderr": 0.0010345794788431668, "rouge2_precision": 0.010519316602496626, "rouge2_precision_stderr": 0.001355747591263505, "rouge2_recall": 0.017499542584772765, "rouge2_recall_stderr": 0.0015490170099444409, "rougeL_fmeasure": 0.039590536804712924, "rougeL_fmeasure_stderr": 0.0022228567744426667, "rougeL_precision": 0.0356382053447805, "rougeL_precision_stderr": 0.002395385288173853, "rougeL_recall": 0.060770117722936286, "rougeL_recall_stderr": 0.0034770592750759917, "rougeLsum_fmeasure": 0.0387553178144167, "rougeLsum_fmeasure_stderr": 0.0022066400343704485, "rougeLsum_precision": 0.035133893923727386, "rougeLsum_precision_stderr": 0.0024011989607887903, "rougeLsum_recall": 0.059405756146875044, "rougeLsum_recall_stderr": 0.003457018339558158}}, "5": {"article_DOC_summary": {"bleu": 7.197738308121429e-37, "bleu_stderr": 1.5261190640932973e-32, "rouge1_fmeasure": 0.002544363512676877, "rouge1_fmeasure_stderr": 0.0007109896306856554, "rouge1_precision": 0.0028705257493446055, "rouge1_precision_stderr": 0.0008218246257449791, "rouge1_recall": 0.0023902360458122112, "rouge1_recall_stderr": 0.000665569783756533, "rouge2_fmeasure": 0.0002809498461785326, "rouge2_fmeasure_stderr": 0.00015434551667733464, "rouge2_precision": 0.00031292391170304596, "rouge2_precision_stderr": 0.00016477755162714296, "rouge2_recall": 0.0002616879975370542, "rouge2_recall_stderr": 0.00014932256088281653, "rougeL_fmeasure": 0.0018550844925242101, "rougeL_fmeasure_stderr": 0.0005069733094142548, "rougeL_precision": 0.0021053678911906607, "rougeL_precision_stderr": 0.0005892152083882312, "rougeL_recall": 0.0017230940880273344, "rougeL_recall_stderr": 0.0004664097240871752, "rougeLsum_fmeasure": 0.001872065671306264, "rougeLsum_fmeasure_stderr": 0.0005341865975835362, "rougeLsum_precision": 0.002095488296127936, "rougeLsum_precision_stderr": 0.00060247869960542, "rougeLsum_recall": 0.001758329007481808, "rougeLsum_recall_stderr": 0.0005034233459254993}}}} \ No newline at end of file diff --git a/4b284b84bc4seed3/evaluation/generation/slim.4b284b84bc4seed3_GEM-web_nlg_en_PALM_prompt_0.json b/4b284b84bc4seed3/evaluation/generation/slim.4b284b84bc4seed3_GEM-web_nlg_en_PALM_prompt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..8f83ca0b80b9dbaf4c921c2f6d1fadd5ba00d8f5 --- /dev/null +++ b/4b284b84bc4seed3/evaluation/generation/slim.4b284b84bc4seed3_GEM-web_nlg_en_PALM_prompt_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.3778578966148067, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.043108338793946065 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07411555032972421, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.001538099367112622 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.309304518659125, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.004647036349994307 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.11229918414347093, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.002038339976908837 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.035405873343107096, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0009494477514351852 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.15177029561380864, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0032441764358631343 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.05373275688087374, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0012922653888554133 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.07128915442841278, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.001421332991618732 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.3006366755077802, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004524046109868848 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.10836013211520433, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.001907062297131903 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.07058874999622211, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0014347547189524324 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.2951817916558195, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004352927117156272 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.10699983162704317, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0018997512152092622 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed3/evaluation/generation/slim.4b284b84bc4seed3_GEM-web_nlg_en_PALM_prompt_1.json b/4b284b84bc4seed3/evaluation/generation/slim.4b284b84bc4seed3_GEM-web_nlg_en_PALM_prompt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..da218e699cb4c55ee8c190a623529ded36ba4132 --- /dev/null +++ b/4b284b84bc4seed3/evaluation/generation/slim.4b284b84bc4seed3_GEM-web_nlg_en_PALM_prompt_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.5559292194446633, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.033063305669521814 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07344134290778047, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0013075775283346684 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.38367122642556717, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005374779689077085 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.11519017450049537, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.001781459047903915 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03451957379808363, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0008237357497660324 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.1902878844491511, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0038667575429744347 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.05429955369368683, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.001164101537291991 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.06953493691658816, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0012180136656132438 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.35915530916109556, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004866166233820879 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.1089395644753034, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.001663152079550431 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.0700241015268691, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0012535074467763 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.36285521927513625, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004946296798374893 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.10966995207767154, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.001701230535057806 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed3/evaluation/generation/slim.4b284b84bc4seed3_GEM-web_nlg_en_PALM_prompt_2.json b/4b284b84bc4seed3/evaluation/generation/slim.4b284b84bc4seed3_GEM-web_nlg_en_PALM_prompt_2.json new file mode 100644 index 0000000000000000000000000000000000000000..e1e8770ee8a7d52e5cb3133f66c469967b18059d --- /dev/null +++ b/4b284b84bc4seed3/evaluation/generation/slim.4b284b84bc4seed3_GEM-web_nlg_en_PALM_prompt_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.5782472127932445, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.02876860184072706 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07332998641209827, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0012278221285519305 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.4051352210429427, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005349246205768158 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.11608314556487608, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0016856934686361683 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.034072750089738806, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007661045363189041 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.20084233643875887, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003927573729716624 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.054101025197296336, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0010930137218225489 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.0682789164826936, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.00114056254383938 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.36994608434763104, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004671069819142146 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.10781733963253654, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0015624544135440744 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.06944433376851597, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0011635802718539946 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.3806199258716764, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004907310655807021 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.10978895909106065, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0015935691932955263 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed3/evaluation/generation/slim.4b284b84bc4seed3_GEM-web_nlg_en_PALM_prompt_3.json b/4b284b84bc4seed3/evaluation/generation/slim.4b284b84bc4seed3_GEM-web_nlg_en_PALM_prompt_3.json new file mode 100644 index 0000000000000000000000000000000000000000..d10f2cfe437d2237cac492849c5f25091974a775 --- /dev/null +++ b/4b284b84bc4seed3/evaluation/generation/slim.4b284b84bc4seed3_GEM-web_nlg_en_PALM_prompt_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.6915008150808406, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.03546518672506001 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07432407498828138, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0012325917015022579 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.4104911461112403, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005343537670914898 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.11803876998559919, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0017025734287338006 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03485135568208787, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007550726857230097 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.20729890874003387, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003943582140548173 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.05560964185032228, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.001085229952279771 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.06880425728281662, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0011244989363678815 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.375153241896145, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004712690263932408 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.10904814717011492, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0015470673139562688 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.07034752749731535, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0011699863791661837 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.3857816920367689, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004912882067435381 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.11156419888096808, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0016120520944898505 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed3/evaluation/generation/slim.4b284b84bc4seed3_GEM-web_nlg_en_PALM_prompt_4.json b/4b284b84bc4seed3/evaluation/generation/slim.4b284b84bc4seed3_GEM-web_nlg_en_PALM_prompt_4.json new file mode 100644 index 0000000000000000000000000000000000000000..6deb2e0002115db025dfc60067e111f6fa8e176c --- /dev/null +++ b/4b284b84bc4seed3/evaluation/generation/slim.4b284b84bc4seed3_GEM-web_nlg_en_PALM_prompt_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.7189066936765581, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.037013333820727926 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.0746932073820224, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0012134517684081734 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.41771020616828414, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0052465481407677345 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.11905897645265517, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0016851385659147225 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.034925003471357664, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007449043245097383 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.21258956488991562, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003996053593134186 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.055971441098147307, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0010771389506484157 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.06837902016461192, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0010967825484641605 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.3778018545867543, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.00455156041833246 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.10871097099572738, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0015089792586892492 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.07063506078356421, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0011518223964322905 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.39341366411170076, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.00485926225127653 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.11244409077423552, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0015904992527627166 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed3/evaluation/generation/slim.4b284b84bc4seed3_GEM-web_nlg_en_PALM_prompt_5.json b/4b284b84bc4seed3/evaluation/generation/slim.4b284b84bc4seed3_GEM-web_nlg_en_PALM_prompt_5.json new file mode 100644 index 0000000000000000000000000000000000000000..3896c8d0771d6f7e049dbed596826d8307853825 --- /dev/null +++ b/4b284b84bc4seed3/evaluation/generation/slim.4b284b84bc4seed3_GEM-web_nlg_en_PALM_prompt_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.7868046756108051, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.02991271086752641 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07492512647076705, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0011666617641076609 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.4328553245785454, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005279295280429884 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.12018582936445632, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0016323788305252095 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03506321715356214, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007143804415237641 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.22123976259437653, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003995978607772992 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.05660828028959127, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0010400981467133133 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.06818310395402347, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0010562464898575118 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.38959556517516325, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004569300260461267 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.10906303355905887, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0014559180672523411 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.07090266049584355, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.001113352975885553 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.4063980496121481, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004844306040632001 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.11355384378827522, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.001550934113029576 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed3/evaluation/generation/slim.4b284b84bc4seed3_GEM-wiki_lingua_en_tldr_en_0.json b/4b284b84bc4seed3/evaluation/generation/slim.4b284b84bc4seed3_GEM-wiki_lingua_en_tldr_en_0.json new file mode 100644 index 0000000000000000000000000000000000000000..87aef70020af18a1a39ebf2a5c2621918521f7f2 --- /dev/null +++ b/4b284b84bc4seed3/evaluation/generation/slim.4b284b84bc4seed3_GEM-wiki_lingua_en_tldr_en_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.15334539415738388, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0019222806905930796 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.26182170525230664, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0027125088120466567 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.1796629653377477, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0018831601953688906 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.031909006707834885, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007708990454599334 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.05633865948240556, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0014288226584569942 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.03752338599482476, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0008657026414927998 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.11977598793404674, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0013475259124603452 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.21260047811552407, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.002226957170728599 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.14212961094234547, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0013510429063892365 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.13994434092556626, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0017396047429116305 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.24051441991616382, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.002515699207499435 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.16422175879907844, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.001702104333489601 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 1.6474987427065775, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.06593859959084909 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed3/evaluation/generation/slim.4b284b84bc4seed3_GEM-wiki_lingua_en_tldr_en_1.json b/4b284b84bc4seed3/evaluation/generation/slim.4b284b84bc4seed3_GEM-wiki_lingua_en_tldr_en_1.json new file mode 100644 index 0000000000000000000000000000000000000000..d523fb5d9d597015d2272b2fbbf5e82098210716 --- /dev/null +++ b/4b284b84bc4seed3/evaluation/generation/slim.4b284b84bc4seed3_GEM-wiki_lingua_en_tldr_en_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.19811750483825502, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.002244284359015066 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.3233361530990366, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0027615810059661346 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.22429676008256744, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0019215432949986416 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.04984071088538675, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0011306753133130294 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.08194485459001105, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.001676052028304491 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.055270992861272274, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0010209237932340483 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.13956446970769343, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.001568888728809687 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.23527321502693888, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.002186112073171261 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.15889068091572497, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0012757988630829789 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.18632650105602275, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.002136419893250326 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.30435788657049767, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.002623892289765707 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.21089500684394413, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.001812341485185825 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 2.786152224873671, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.05808815291287487 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed3/evaluation/generation/slim.4b284b84bc4seed3_GEM-wiki_lingua_en_tldr_en_2.json b/4b284b84bc4seed3/evaluation/generation/slim.4b284b84bc4seed3_GEM-wiki_lingua_en_tldr_en_2.json new file mode 100644 index 0000000000000000000000000000000000000000..f4425fe4b37f7515c9901877feeaf6dfb2796247 --- /dev/null +++ b/4b284b84bc4seed3/evaluation/generation/slim.4b284b84bc4seed3_GEM-wiki_lingua_en_tldr_en_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.21033059542814828, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.002442858582337002 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.32413547755906186, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0028003239001999137 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.22937813566648368, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0019219764317323842 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.05523685617830656, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0012874559073350383 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.08462329830096554, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0017673558504113702 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.058712455420886434, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0010940197542857381 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.1497674533077381, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0018524531908293406 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.23560418818517648, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0022704842678573766 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.16297597705988986, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0013304409687103912 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.19887451626852745, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.002331309192885264 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.3069248020961403, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0026805984377935225 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.21693278589564352, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0018227504624372965 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 3.230998083062549, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.050797557201713334 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed3/evaluation/generation/slim.4b284b84bc4seed3_GEM-wiki_lingua_en_tldr_en_3.json b/4b284b84bc4seed3/evaluation/generation/slim.4b284b84bc4seed3_GEM-wiki_lingua_en_tldr_en_3.json new file mode 100644 index 0000000000000000000000000000000000000000..a3706242261cd8eb683bd0bbde5a59b510d103e2 --- /dev/null +++ b/4b284b84bc4seed3/evaluation/generation/slim.4b284b84bc4seed3_GEM-wiki_lingua_en_tldr_en_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.1806956214983726, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0027831512016435046 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.2623447416585146, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0033680997374848517 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.1876832021711141, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0022940658612174095 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.047673762536966334, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0013822773824892138 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.0697044253840176, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.001729633370079589 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.04841722766281516, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0011008037910137322 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.13209227506220064, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.002157083339054086 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.193574388819157, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0026303701953405384 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.13587871163748794, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0016337548444324763 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.1711795821823165, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.002664487441078435 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.24863617061757418, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0032228879303417934 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.17759916274930226, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0021766669356267855 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 3.2098001105373206, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.09099300025969562 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed3/evaluation/generation/slim.4b284b84bc4seed3_GEM-wiki_lingua_en_tldr_en_4.json b/4b284b84bc4seed3/evaluation/generation/slim.4b284b84bc4seed3_GEM-wiki_lingua_en_tldr_en_4.json new file mode 100644 index 0000000000000000000000000000000000000000..50d272f6fb627222d1a7dd726ec4fc465d380f0e --- /dev/null +++ b/4b284b84bc4seed3/evaluation/generation/slim.4b284b84bc4seed3_GEM-wiki_lingua_en_tldr_en_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.05880934489289142, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0022689626423463057 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.08575740200155547, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.002995322533624644 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.05909725046757388, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0020201095521583104 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.015110877443934299, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.000991369440072553 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.022701528371762265, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.001245597630024608 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.014955192433241102, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0007610692004221399 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.04469761272469577, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0018115322606699102 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.06493843037748623, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0023175889760991357 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.044050934610035515, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.001498662498119108 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.0553855629257085, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0021577985213379713 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.08067508006348567, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0028298079410380454 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.055485095239080344, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0018978766900965142 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 0.6098983821550592, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.057390083475920894 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed3/evaluation/generation/slim.4b284b84bc4seed3_GEM-wiki_lingua_en_tldr_en_5.json b/4b284b84bc4seed3/evaluation/generation/slim.4b284b84bc4seed3_GEM-wiki_lingua_en_tldr_en_5.json new file mode 100644 index 0000000000000000000000000000000000000000..020ee16a31a7cd2b45834c7e8c8b50fe74e9c5db --- /dev/null +++ b/4b284b84bc4seed3/evaluation/generation/slim.4b284b84bc4seed3_GEM-wiki_lingua_en_tldr_en_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.009364139423338884, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0010022987284321672 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.014018983768781176, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0013739169170373748 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.009438215462949508, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0008930219445271543 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.002554638785654485, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0004139088387696996 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.004058440910233081, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0006059287974265584 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.002492491138928612, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.00033796870035768413 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.007004878000531978, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0007704906553010422 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.010728122020319702, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0010948722482846322 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.007008419627805089, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0006680187288932387 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.008716167882302485, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0009417371430749615 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.013083621795425198, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0012869514383126801 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.008755675533348816, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0008272404703615799 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 7.585034963472076e-07, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 1.5369928370922445e-06 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed3/evaluation/generation/slim.4b284b84bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_0.json b/4b284b84bc4seed3/evaluation/generation/slim.4b284b84bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..976bb2caa4af456a970c71978bf68c70b9f7bed0 --- /dev/null +++ b/4b284b84bc4seed3/evaluation/generation/slim.4b284b84bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 2.302445011589307, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.06211023865546385 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.12233139227806873, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0010629452092601635 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.25742079610936297, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.001800775093152571 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.16312944483849517, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0012810447257741884 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.030911049123290638, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0007417529238496929 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.06285991268008932, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0015091563495189734 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.04090223997307209, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0009736983422614277 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.12118590550392237, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0010248820684599837 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.2555207273914006, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.001760350193080484 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.16171573051604754, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0012389880599311676 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.09601857609439678, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0009739557630404562 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.20198211758201637, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0017356209782491401 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.1280356806160262, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0012028446220128677 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed3/evaluation/generation/slim.4b284b84bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_1.json b/4b284b84bc4seed3/evaluation/generation/slim.4b284b84bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_1.json new file mode 100644 index 0000000000000000000000000000000000000000..91f3c90d02cc1d52bbeb283051af76d6fc4de024 --- /dev/null +++ b/4b284b84bc4seed3/evaluation/generation/slim.4b284b84bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 9.263924206317883, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.07741695657438914 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.46181278849346963, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.003686608618192092 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4286623121704012, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.003005228287502819 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.4034314142097248, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0022118879808028843 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.2127064486018551, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0026018988957500753 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.19238207615248135, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.00208794348752037 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.18184691082787147, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0018176157547358858 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.3491570035267105, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.003076016478420658 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3262548928750604, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.002559992101041393 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.3047130282688444, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0018640708877106472 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.3805884982861303, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0034128765580002424 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.35050122813254053, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0027309493870352275 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.33103396853758926, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.002167584950514449 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed3/evaluation/generation/slim.4b284b84bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_2.json b/4b284b84bc4seed3/evaluation/generation/slim.4b284b84bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_2.json new file mode 100644 index 0000000000000000000000000000000000000000..c6e6f86c3fe42fa6637c7a4380d3ccca0540f953 --- /dev/null +++ b/4b284b84bc4seed3/evaluation/generation/slim.4b284b84bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 10.065169479277689, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.13743485776863448 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.4521349721323409, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0037077133304098463 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4576969276598449, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.002912059970191956 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.41741556545511066, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0022731192955223276 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.2175791657307876, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0026523412395747367 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.21609856115013357, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.002192652821722558 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.19704389881949605, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0018909764984676675 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.34696313010753177, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0030525069814565397 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3551058458123904, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.00253577560262687 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.32096479784507037, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0018970324444313584 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.3795245084348248, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.003449429352786332 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3815645358661485, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002712452534885871 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.349200751229774, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0022493473991314562 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed3/evaluation/generation/slim.4b284b84bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_3.json b/4b284b84bc4seed3/evaluation/generation/slim.4b284b84bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_3.json new file mode 100644 index 0000000000000000000000000000000000000000..9e5bd4f015fcad9dd0397e45c63087c0b53dd75e --- /dev/null +++ b/4b284b84bc4seed3/evaluation/generation/slim.4b284b84bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 11.409501258883944, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.200735926048327 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.47359150110281645, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0035801720410154575 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.46852198178337934, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0028471977217635184 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.4385722344979268, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0023100736158786 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.23359678515529092, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0026715948188736267 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.22730491424875773, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.002252917174717242 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.21297415730718317, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.002002023485009685 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.36122582263536407, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0030394944731669572 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.35939795651767675, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.002511542644538787 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.33437569173005427, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0020107174748746504 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.3998844531789924, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0033854020792017285 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3938246920292058, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002729767161367992 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.36932279359236814, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0023179469576599027 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed3/evaluation/generation/slim.4b284b84bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_4.json b/4b284b84bc4seed3/evaluation/generation/slim.4b284b84bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_4.json new file mode 100644 index 0000000000000000000000000000000000000000..d29a7231db794b0e443cd69d99b34a7c426b26df --- /dev/null +++ b/4b284b84bc4seed3/evaluation/generation/slim.4b284b84bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 12.452122590183434, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.16404160542943327 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.49497236517824444, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0035535658412753006 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4725995896409827, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0028157186492877196 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.45315190664308314, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.002278710461652685 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.24812095038732754, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0027737064203339212 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.2324345352491202, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.002259923232212951 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.22316519517459477, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0020371724840063865 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.3745330183490656, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0030718020025572107 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3585821251012964, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0024911676803155646 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.34240410488312567, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0020393007899216064 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.4179948014646539, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0033899691757338438 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3979598039322067, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0027471446794053813 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.38201002954999475, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.002335148377240596 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed3/evaluation/generation/slim.4b284b84bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_5.json b/4b284b84bc4seed3/evaluation/generation/slim.4b284b84bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_5.json new file mode 100644 index 0000000000000000000000000000000000000000..7945e374615404285b261b3c2fe8c8342dc5f52c --- /dev/null +++ b/4b284b84bc4seed3/evaluation/generation/slim.4b284b84bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 13.309002924662785, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.24361495936574476 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.5055114743909561, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0034029405989093315 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.47439394771123267, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0027085795597238727 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.46337099933680953, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0022284128767927217 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.2543085325831986, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0026833318688377957 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.23498034253109115, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0022102671857103136 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.22971317638516242, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0020276942034306005 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.38203696819305627, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0029643784309907667 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.35829625222003997, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.002388395524420644 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.3493044245188954, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0020072603771810445 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.4307656306766157, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.003270545893660294 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.4032599450584402, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0026395356242984963 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.39422575829822615, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0022790324609071426 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed3/evaluation/generation/slim.4b284b84bc4seed3_gem_xsum_article_DOC_summary_0.json b/4b284b84bc4seed3/evaluation/generation/slim.4b284b84bc4seed3_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..e21e656b68db8beeb44c041cd2546f486b854fcf --- /dev/null +++ b/4b284b84bc4seed3/evaluation/generation/slim.4b284b84bc4seed3_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.15448121328596862, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.001977188397188564 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.35997124440611034, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004298205436694583 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.2118853569842521, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0024831762617585746 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.03645241402160218, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0011752236536019232 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.08865405071591761, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0029077149755190814 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.05056562034464029, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.001595549541223809 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.11766298156431257, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.00154525669786904 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.27589374122183485, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0034812956688468695 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.161553829612935, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0019356026144079317 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.12262950144266513, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0016994024464092056 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.28822399594677356, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.003908951289350794 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.1685758842303753, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.002177154066590156 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 2.061265150562031, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.1047194903989246 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed3/evaluation/generation/slim.4b284b84bc4seed3_gem_xsum_article_DOC_summary_1.json b/4b284b84bc4seed3/evaluation/generation/slim.4b284b84bc4seed3_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..7c067fa71319deee3b83afe1a21364efb941f8c2 --- /dev/null +++ b/4b284b84bc4seed3/evaluation/generation/slim.4b284b84bc4seed3_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.12615666366329323, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0019462075646106281 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.3075463314111142, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004435681902516454 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.17677552083071896, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0026150769110123255 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.025631403863087567, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0010195570539420784 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.0643057936335091, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0025821054535310178 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.036209551359239395, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.001431805409098863 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.09789606233860006, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0014408570567453658 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.2409666745294604, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0034493105763191037 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.1375227449624894, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0019568848326575864 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.09901294724556717, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0015797250447342009 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.24365682374976821, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0037520223325616334 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.13906823791458356, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.002145977759148375 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.4701047191488112, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.052325655561989 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed3/evaluation/generation/slim.4b284b84bc4seed3_gem_xsum_article_DOC_summary_2.json b/4b284b84bc4seed3/evaluation/generation/slim.4b284b84bc4seed3_gem_xsum_article_DOC_summary_2.json new file mode 100644 index 0000000000000000000000000000000000000000..5c4185ddcdfd5ea773a78900d989501319dde5ac --- /dev/null +++ b/4b284b84bc4seed3/evaluation/generation/slim.4b284b84bc4seed3_gem_xsum_article_DOC_summary_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.12819697138408215, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.001923900850974331 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.3131959520911201, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004483015545746866 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.17977482443218196, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0025982011983283434 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.02774216419058187, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0010191913758900069 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.07049404002692027, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.002708125093624563 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.03935463682151496, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.001450577987245735 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.10245043926274368, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0014451803861143982 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.251818647068035, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.003494519863990314 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.14388467760513854, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0019644343349970836 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.09951049154417256, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0015455068687096165 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.24565320812202304, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0037974977466490017 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.13992101774839874, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.002118355649079576 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.4983004480453936, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.08614156872925424 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed3/evaluation/generation/slim.4b284b84bc4seed3_gem_xsum_article_DOC_summary_3.json b/4b284b84bc4seed3/evaluation/generation/slim.4b284b84bc4seed3_gem_xsum_article_DOC_summary_3.json new file mode 100644 index 0000000000000000000000000000000000000000..5ae45b6b9005a94f5449dc627b1d47ca203aa7f6 --- /dev/null +++ b/4b284b84bc4seed3/evaluation/generation/slim.4b284b84bc4seed3_gem_xsum_article_DOC_summary_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.12507167063309826, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0020654668780499437 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.29352230739872903, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.0046129265452261245 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.1716640710662149, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.002692661486106222 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.0273731792590075, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.001058152769608845 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.06719512443269011, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.002640278987747084 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.0383031309264901, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.001471824908387901 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.10247899612143699, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0016344209712852228 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.24201656560824256, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0037826395255217203 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.1409323879677072, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.00215402254496125 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.09654487009443463, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0016852992800909113 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.2286055088707561, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.003922038940141684 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.13277160506058835, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.002226502076197834 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.5436814601886297, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.10599321563006747 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed3/evaluation/generation/slim.4b284b84bc4seed3_gem_xsum_article_DOC_summary_4.json b/4b284b84bc4seed3/evaluation/generation/slim.4b284b84bc4seed3_gem_xsum_article_DOC_summary_4.json new file mode 100644 index 0000000000000000000000000000000000000000..5fdcc384300e0afe8a0da3591300b875d11b5072 --- /dev/null +++ b/4b284b84bc4seed3/evaluation/generation/slim.4b284b84bc4seed3_gem_xsum_article_DOC_summary_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.0429708507344084, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0028037413845202774 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.07465376472309838, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004321865151720348 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.04863969374523076, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.002793420771992738 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.010519316602496626, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.001355747591263505 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.017499542584772765, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0015490170099444409 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.011395576090619692, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0010345794788431668 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.0356382053447805, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.002395385288173853 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.060770117722936286, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0034770592750759917 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.039590536804712924, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0022228567744426667 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.035133893923727386, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0024011989607887903 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.059405756146875044, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.003457018339558158 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.0387553178144167, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0022066400343704485 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 0.7915506170854982, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.13278546480806505 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed3/evaluation/generation/slim.4b284b84bc4seed3_gem_xsum_article_DOC_summary_5.json b/4b284b84bc4seed3/evaluation/generation/slim.4b284b84bc4seed3_gem_xsum_article_DOC_summary_5.json new file mode 100644 index 0000000000000000000000000000000000000000..1584ffc9072bb94b2d6a9506b9287b9b15234784 --- /dev/null +++ b/4b284b84bc4seed3/evaluation/generation/slim.4b284b84bc4seed3_gem_xsum_article_DOC_summary_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.0028705257493446055, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0008218246257449791 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.0023902360458122112, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.000665569783756533 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.002544363512676877, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0007109896306856554 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.00031292391170304596, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.00016477755162714296 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.0002616879975370542, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.00014932256088281653 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.0002809498461785326, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.00015434551667733464 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.0021053678911906607, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0005892152083882312 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.0017230940880273344, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0004664097240871752 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.0018550844925242101, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0005069733094142548 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.002095488296127936, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.00060247869960542 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.001758329007481808, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0005034233459254993 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.001872065671306264, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0005341865975835362 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 7.197738308121429e-37, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 1.5261190640932973e-32 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed3/evaluation/rankeval/4b284b84bc4seed3_0.csv b/4b284b84bc4seed3/evaluation/rankeval/4b284b84bc4seed3_0.csv new file mode 100644 index 0000000000000000000000000000000000000000..2bf82ce112ebc535d183f05b9339400f5d02f75c --- /dev/null +++ b/4b284b84bc4seed3/evaluation/rankeval/4b284b84bc4seed3_0.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.342,0.01500870618212173,0 +anli_r2,acc,0.346,0.015050266127564441,0 +anli_r3,acc,0.3408333333333333,0.013688600793296939,0 +arc_challenge,acc,0.2841296928327645,0.013179442447653886,0 +arc_challenge,acc_norm,0.29692832764505117,0.013352025976725223,0 +arc_easy,acc,0.6224747474747475,0.009947227833469435,0 +arc_easy,acc_norm,0.5437710437710438,0.01022039438372202,0 +boolq,acc,0.6165137614678899,0.008504304838837027,1 +cb,acc,0.39285714285714285,0.0658538889806635,1 +cb,f1,0.24418093983311376,,1 +copa,acc,0.78,0.04163331998932262,0 +hellaswag,acc,0.4781915952997411,0.004985032806802436,0 +hellaswag,acc_norm,0.6294562836088429,0.004819633668832535,0 +piqa,acc,0.7519042437431991,0.010077118315574719,0 +piqa,acc_norm,0.7611534276387377,0.009948120385337485,0 +rte,acc,0.5487364620938628,0.029953149241808943,0 +sciq,acc,0.848,0.011358918303475279,0 +sciq,acc_norm,0.76,0.013512312258920831,0 +storycloze_2016,acc,0.7247461250668092,0.010328538400500567,0 +winogrande,acc,0.6045777426992897,0.013741678387545348,0 diff --git a/4b284b84bc4seed3/evaluation/rankeval/4b284b84bc4seed3_0.json b/4b284b84bc4seed3/evaluation/rankeval/4b284b84bc4seed3_0.json new file mode 100644 index 0000000000000000000000000000000000000000..9778e1ca5e134f5f3908a89e7dcae2f2c954436e --- /dev/null +++ b/4b284b84bc4seed3/evaluation/rankeval/4b284b84bc4seed3_0.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.342, + "acc_stderr": 0.01500870618212173 + }, + "anli_r2": { + "acc": 0.346, + "acc_stderr": 0.015050266127564441 + }, + "anli_r3": { + "acc": 0.3408333333333333, + "acc_stderr": 0.013688600793296939 + }, + "cb": { + "acc": 0.39285714285714285, + "acc_stderr": 0.0658538889806635, + "f1": 0.24418093983311376 + }, + "copa": { + "acc": 0.78, + "acc_stderr": 0.04163331998932262 + }, + "hellaswag": { + "acc": 0.4781915952997411, + "acc_stderr": 0.004985032806802436, + "acc_norm": 0.6294562836088429, + "acc_norm_stderr": 0.004819633668832535 + }, + "rte": { + "acc": 0.5487364620938628, + "acc_stderr": 0.029953149241808943 + }, + "winogrande": { + "acc": 0.6045777426992897, + "acc_stderr": 0.013741678387545348 + }, + "storycloze_2016": { + "acc": 0.7247461250668092, + "acc_stderr": 0.010328538400500567 + }, + "boolq": { + "acc": 0.6165137614678899, + "acc_stderr": 0.008504304838837027 + }, + "arc_easy": { + "acc": 0.6224747474747475, + "acc_stderr": 0.009947227833469435, + "acc_norm": 0.5437710437710438, + "acc_norm_stderr": 0.01022039438372202 + }, + "arc_challenge": { + "acc": 0.2841296928327645, + "acc_stderr": 0.013179442447653886, + "acc_norm": 0.29692832764505117, + "acc_norm_stderr": 0.013352025976725223 + }, + "sciq": { + "acc": 0.848, + "acc_stderr": 0.011358918303475279, + "acc_norm": 0.76, + "acc_norm_stderr": 0.013512312258920831 + }, + "piqa": { + "acc": 0.7519042437431991, + "acc_stderr": 0.010077118315574719, + "acc_norm": 0.7611534276387377, + "acc_norm_stderr": 0.009948120385337485 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed3/evaluation/rankeval/4b284b84bc4seed3_1.csv b/4b284b84bc4seed3/evaluation/rankeval/4b284b84bc4seed3_1.csv new file mode 100644 index 0000000000000000000000000000000000000000..a6c2ca30aee61aab4d9d044f62b8005c3d3a9b66 --- /dev/null +++ b/4b284b84bc4seed3/evaluation/rankeval/4b284b84bc4seed3_1.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.316,0.014709193056057128,0 +anli_r2,acc,0.333,0.014910846164229863,0 +anli_r3,acc,0.35,0.013774667009018554,0 +arc_challenge,acc,0.2815699658703072,0.013143376735009024,0 +arc_challenge,acc_norm,0.30802047781569963,0.013491429517292038,0 +arc_easy,acc,0.627104377104377,0.009922743197129257,0 +arc_easy,acc_norm,0.5955387205387206,0.010070746648278795,0 +boolq,acc,0.5896024464831804,0.008603488048617521,1 +cb,acc,0.30357142857142855,0.06199938655510754,1 +cb,f1,0.24554767533490937,,1 +copa,acc,0.78,0.04163331998932261,0 +hellaswag,acc,0.4780920135431189,0.004984989320648131,0 +hellaswag,acc_norm,0.6307508464449313,0.004816152074023083,0 +piqa,acc,0.7486398258977149,0.010121156016819257,0 +piqa,acc_norm,0.7611534276387377,0.009948120385337485,0 +rte,acc,0.5812274368231047,0.029696661081234824,0 +sciq,acc,0.901,0.009449248027662765,0 +sciq,acc_norm,0.884,0.010131468138756997,0 +storycloze_2016,acc,0.7188669160876536,0.010395836091628103,0 +winogrande,acc,0.5840568271507498,0.013852485356798252,0 diff --git a/4b284b84bc4seed3/evaluation/rankeval/4b284b84bc4seed3_1.json b/4b284b84bc4seed3/evaluation/rankeval/4b284b84bc4seed3_1.json new file mode 100644 index 0000000000000000000000000000000000000000..f7a1e05bee0353e0c5952aa36592f47872676f7d --- /dev/null +++ b/4b284b84bc4seed3/evaluation/rankeval/4b284b84bc4seed3_1.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.316, + "acc_stderr": 0.014709193056057128 + }, + "anli_r2": { + "acc": 0.333, + "acc_stderr": 0.014910846164229863 + }, + "anli_r3": { + "acc": 0.35, + "acc_stderr": 0.013774667009018554 + }, + "cb": { + "acc": 0.30357142857142855, + "acc_stderr": 0.06199938655510754, + "f1": 0.24554767533490937 + }, + "copa": { + "acc": 0.78, + "acc_stderr": 0.04163331998932261 + }, + "hellaswag": { + "acc": 0.4780920135431189, + "acc_stderr": 0.004984989320648131, + "acc_norm": 0.6307508464449313, + "acc_norm_stderr": 0.004816152074023083 + }, + "rte": { + "acc": 0.5812274368231047, + "acc_stderr": 0.029696661081234824 + }, + "winogrande": { + "acc": 0.5840568271507498, + "acc_stderr": 0.013852485356798252 + }, + "storycloze_2016": { + "acc": 0.7188669160876536, + "acc_stderr": 0.010395836091628103 + }, + "boolq": { + "acc": 0.5896024464831804, + "acc_stderr": 0.008603488048617521 + }, + "arc_easy": { + "acc": 0.627104377104377, + "acc_stderr": 0.009922743197129257, + "acc_norm": 0.5955387205387206, + "acc_norm_stderr": 0.010070746648278795 + }, + "arc_challenge": { + "acc": 0.2815699658703072, + "acc_stderr": 0.013143376735009024, + "acc_norm": 0.30802047781569963, + "acc_norm_stderr": 0.013491429517292038 + }, + "sciq": { + "acc": 0.901, + "acc_stderr": 0.009449248027662765, + "acc_norm": 0.884, + "acc_norm_stderr": 0.010131468138756997 + }, + "piqa": { + "acc": 0.7486398258977149, + "acc_stderr": 0.010121156016819257, + "acc_norm": 0.7611534276387377, + "acc_norm_stderr": 0.009948120385337485 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed3/evaluation/rankeval/4b284b84bc4seed3_2.csv b/4b284b84bc4seed3/evaluation/rankeval/4b284b84bc4seed3_2.csv new file mode 100644 index 0000000000000000000000000000000000000000..6773fa79bf500f274eff30f82a0c5315ddb13699 --- /dev/null +++ b/4b284b84bc4seed3/evaluation/rankeval/4b284b84bc4seed3_2.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.335,0.014933117490932575,0 +anli_r2,acc,0.351,0.015100563798316403,0 +anli_r3,acc,0.3375,0.013655897185463658,0 +arc_challenge,acc,0.2841296928327645,0.013179442447653887,0 +arc_challenge,acc_norm,0.3199658703071672,0.013631345807016191,0 +arc_easy,acc,0.6376262626262627,0.009863468202583783,0 +arc_easy,acc_norm,0.627104377104377,0.009922743197129241,0 +boolq,acc,0.5755351681957187,0.008644688121685498,1 +cb,acc,0.32142857142857145,0.0629736228905634,1 +cb,f1,0.2819405899886936,,1 +copa,acc,0.76,0.04292346959909282,0 +hellaswag,acc,0.47629954192391954,0.004984172621822885,0 +hellaswag,acc_norm,0.6317466640111532,0.00481344861540445,0 +piqa,acc,0.750816104461371,0.010091882770120216,0 +piqa,acc_norm,0.7682263329706203,0.009845143772794048,0 +rte,acc,0.5342960288808665,0.030025579819366422,0 +sciq,acc,0.912,0.008963053962592074,0 +sciq,acc_norm,0.889,0.009938701010583726,0 +storycloze_2016,acc,0.7194013896312133,0.010389809647288827,0 +winogrande,acc,0.6069455406471981,0.013727276249108453,0 diff --git a/4b284b84bc4seed3/evaluation/rankeval/4b284b84bc4seed3_2.json b/4b284b84bc4seed3/evaluation/rankeval/4b284b84bc4seed3_2.json new file mode 100644 index 0000000000000000000000000000000000000000..e41fd026a52bb20d4b6a8111ec49099b1f47fe05 --- /dev/null +++ b/4b284b84bc4seed3/evaluation/rankeval/4b284b84bc4seed3_2.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.335, + "acc_stderr": 0.014933117490932575 + }, + "anli_r2": { + "acc": 0.351, + "acc_stderr": 0.015100563798316403 + }, + "anli_r3": { + "acc": 0.3375, + "acc_stderr": 0.013655897185463658 + }, + "cb": { + "acc": 0.32142857142857145, + "acc_stderr": 0.0629736228905634, + "f1": 0.2819405899886936 + }, + "copa": { + "acc": 0.76, + "acc_stderr": 0.04292346959909282 + }, + "hellaswag": { + "acc": 0.47629954192391954, + "acc_stderr": 0.004984172621822885, + "acc_norm": 0.6317466640111532, + "acc_norm_stderr": 0.00481344861540445 + }, + "rte": { + "acc": 0.5342960288808665, + "acc_stderr": 0.030025579819366422 + }, + "winogrande": { + "acc": 0.6069455406471981, + "acc_stderr": 0.013727276249108453 + }, + "storycloze_2016": { + "acc": 0.7194013896312133, + "acc_stderr": 0.010389809647288827 + }, + "boolq": { + "acc": 0.5755351681957187, + "acc_stderr": 0.008644688121685498 + }, + "arc_easy": { + "acc": 0.6376262626262627, + "acc_stderr": 0.009863468202583783, + "acc_norm": 0.627104377104377, + "acc_norm_stderr": 0.009922743197129241 + }, + "arc_challenge": { + "acc": 0.2841296928327645, + "acc_stderr": 0.013179442447653887, + "acc_norm": 0.3199658703071672, + "acc_norm_stderr": 0.013631345807016191 + }, + "sciq": { + "acc": 0.912, + "acc_stderr": 0.008963053962592074, + "acc_norm": 0.889, + "acc_norm_stderr": 0.009938701010583726 + }, + "piqa": { + "acc": 0.750816104461371, + "acc_stderr": 0.010091882770120216, + "acc_norm": 0.7682263329706203, + "acc_norm_stderr": 0.009845143772794048 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed3/evaluation/rankeval/4b284b84bc4seed3_3.csv b/4b284b84bc4seed3/evaluation/rankeval/4b284b84bc4seed3_3.csv new file mode 100644 index 0000000000000000000000000000000000000000..c6ae93b349cb85d40f2f2eecb1c2d693824c4479 --- /dev/null +++ b/4b284b84bc4seed3/evaluation/rankeval/4b284b84bc4seed3_3.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.346,0.015050266127564434,0 +anli_r2,acc,0.363,0.015213890444671281,0 +anli_r3,acc,0.3458333333333333,0.013736245342311012,0 +arc_challenge,acc,0.29948805460750855,0.013385021637313576,0 +arc_challenge,acc_norm,0.3250853242320819,0.013688147309729122,0 +arc_easy,acc,0.6397306397306397,0.009851002584732383,0 +arc_easy,acc_norm,0.627104377104377,0.009922743197129241,0 +boolq,acc,0.5740061162079511,0.008648732832949143,1 +cb,acc,0.3392857142857143,0.06384226561930827,1 +cb,f1,0.3177045177045177,,1 +copa,acc,0.83,0.03775251680686371,0 +hellaswag,acc,0.47938657637920734,0.004985539159783413,0 +hellaswag,acc_norm,0.633240390360486,0.004809352075008956,0 +piqa,acc,0.7535364526659413,0.010054810789671822,0 +piqa,acc_norm,0.7704026115342764,0.009812682950815183,0 +rte,acc,0.5523465703971119,0.02993107036293953,0 +sciq,acc,0.914,0.008870325962594766,0 +sciq,acc_norm,0.906,0.009233052000787733,0 +storycloze_2016,acc,0.729021913415286,0.010278188399635044,0 +winogrande,acc,0.6029992107340174,0.0137510925198067,0 diff --git a/4b284b84bc4seed3/evaluation/rankeval/4b284b84bc4seed3_3.json b/4b284b84bc4seed3/evaluation/rankeval/4b284b84bc4seed3_3.json new file mode 100644 index 0000000000000000000000000000000000000000..4c7c8a1faa0b0aa4639f737e51b5f1c0a21628d3 --- /dev/null +++ b/4b284b84bc4seed3/evaluation/rankeval/4b284b84bc4seed3_3.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.346, + "acc_stderr": 0.015050266127564434 + }, + "anli_r2": { + "acc": 0.363, + "acc_stderr": 0.015213890444671281 + }, + "anli_r3": { + "acc": 0.3458333333333333, + "acc_stderr": 0.013736245342311012 + }, + "cb": { + "acc": 0.3392857142857143, + "acc_stderr": 0.06384226561930827, + "f1": 0.3177045177045177 + }, + "copa": { + "acc": 0.83, + "acc_stderr": 0.03775251680686371 + }, + "hellaswag": { + "acc": 0.47938657637920734, + "acc_stderr": 0.004985539159783413, + "acc_norm": 0.633240390360486, + "acc_norm_stderr": 0.004809352075008956 + }, + "rte": { + "acc": 0.5523465703971119, + "acc_stderr": 0.02993107036293953 + }, + "winogrande": { + "acc": 0.6029992107340174, + "acc_stderr": 0.0137510925198067 + }, + "storycloze_2016": { + "acc": 0.729021913415286, + "acc_stderr": 0.010278188399635044 + }, + "boolq": { + "acc": 0.5740061162079511, + "acc_stderr": 0.008648732832949143 + }, + "arc_easy": { + "acc": 0.6397306397306397, + "acc_stderr": 0.009851002584732383, + "acc_norm": 0.627104377104377, + "acc_norm_stderr": 0.009922743197129241 + }, + "arc_challenge": { + "acc": 0.29948805460750855, + "acc_stderr": 0.013385021637313576, + "acc_norm": 0.3250853242320819, + "acc_norm_stderr": 0.013688147309729122 + }, + "sciq": { + "acc": 0.914, + "acc_stderr": 0.008870325962594766, + "acc_norm": 0.906, + "acc_norm_stderr": 0.009233052000787733 + }, + "piqa": { + "acc": 0.7535364526659413, + "acc_stderr": 0.010054810789671822, + "acc_norm": 0.7704026115342764, + "acc_norm_stderr": 0.009812682950815183 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed3/evaluation/rankeval/4b284b84bc4seed3_4.csv b/4b284b84bc4seed3/evaluation/rankeval/4b284b84bc4seed3_4.csv new file mode 100644 index 0000000000000000000000000000000000000000..2711a2ee2ddf17083319f04cab42848fe14767c2 --- /dev/null +++ b/4b284b84bc4seed3/evaluation/rankeval/4b284b84bc4seed3_4.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.339,0.014976758771620345,0 +anli_r2,acc,0.355,0.015139491543780532,0 +anli_r3,acc,0.3333333333333333,0.013613950010225603,0 +arc_challenge,acc,0.2901023890784983,0.01326157367752077,0 +arc_challenge,acc_norm,0.3199658703071672,0.013631345807016193,0 +arc_easy,acc,0.6494107744107744,0.00979100382983156,0 +arc_easy,acc_norm,0.6279461279461279,0.009918187193096471,0 +boolq,acc,0.5620795107033639,0.008677388652709261,1 +cb,acc,0.375,0.06527912098338669,1 +cb,f1,0.3383838383838384,,1 +copa,acc,0.81,0.03942772444036623,0 +hellaswag,acc,0.475502887870942,0.0049837889926812,0 +hellaswag,acc_norm,0.6351324437363075,0.004804091708812568,0 +piqa,acc,0.7524483133841132,0.010069703966857102,0 +piqa,acc_norm,0.764417845484222,0.009901067586473885,0 +rte,acc,0.5523465703971119,0.02993107036293953,0 +sciq,acc,0.921,0.008534156773333442,0 +sciq,acc_norm,0.919,0.00863212103213998,0 +storycloze_2016,acc,0.7354355959380011,0.010200400541714165,0 +winogrande,acc,0.6006314127861089,0.013764933546717612,0 diff --git a/4b284b84bc4seed3/evaluation/rankeval/4b284b84bc4seed3_4.json b/4b284b84bc4seed3/evaluation/rankeval/4b284b84bc4seed3_4.json new file mode 100644 index 0000000000000000000000000000000000000000..d83501d50acfa89185c06a1adb5f2da7144e0c41 --- /dev/null +++ b/4b284b84bc4seed3/evaluation/rankeval/4b284b84bc4seed3_4.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.339, + "acc_stderr": 0.014976758771620345 + }, + "anli_r2": { + "acc": 0.355, + "acc_stderr": 0.015139491543780532 + }, + "anli_r3": { + "acc": 0.3333333333333333, + "acc_stderr": 0.013613950010225603 + }, + "cb": { + "acc": 0.375, + "acc_stderr": 0.06527912098338669, + "f1": 0.3383838383838384 + }, + "copa": { + "acc": 0.81, + "acc_stderr": 0.03942772444036623 + }, + "hellaswag": { + "acc": 0.475502887870942, + "acc_stderr": 0.0049837889926812, + "acc_norm": 0.6351324437363075, + "acc_norm_stderr": 0.004804091708812568 + }, + "rte": { + "acc": 0.5523465703971119, + "acc_stderr": 0.02993107036293953 + }, + "winogrande": { + "acc": 0.6006314127861089, + "acc_stderr": 0.013764933546717612 + }, + "storycloze_2016": { + "acc": 0.7354355959380011, + "acc_stderr": 0.010200400541714165 + }, + "boolq": { + "acc": 0.5620795107033639, + "acc_stderr": 0.008677388652709261 + }, + "arc_easy": { + "acc": 0.6494107744107744, + "acc_stderr": 0.00979100382983156, + "acc_norm": 0.6279461279461279, + "acc_norm_stderr": 0.009918187193096471 + }, + "arc_challenge": { + "acc": 0.2901023890784983, + "acc_stderr": 0.01326157367752077, + "acc_norm": 0.3199658703071672, + "acc_norm_stderr": 0.013631345807016193 + }, + "sciq": { + "acc": 0.921, + "acc_stderr": 0.008534156773333442, + "acc_norm": 0.919, + "acc_norm_stderr": 0.00863212103213998 + }, + "piqa": { + "acc": 0.7524483133841132, + "acc_stderr": 0.010069703966857102, + "acc_norm": 0.764417845484222, + "acc_norm_stderr": 0.009901067586473885 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed3/evaluation/rankeval/4b284b84bc4seed3_5.csv b/4b284b84bc4seed3/evaluation/rankeval/4b284b84bc4seed3_5.csv new file mode 100644 index 0000000000000000000000000000000000000000..4288d046a1cff0074249ccf3b2b57d40cd17d973 --- /dev/null +++ b/4b284b84bc4seed3/evaluation/rankeval/4b284b84bc4seed3_5.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.328,0.014853842487270334,0 +anli_r2,acc,0.348,0.01507060460376841,0 +anli_r3,acc,0.34833333333333333,0.013759437498874072,0 +arc_challenge,acc,0.28924914675767915,0.013250012579393443,0 +arc_challenge,acc_norm,0.3242320819112628,0.013678810399518815,0 +arc_easy,acc,0.6464646464646465,0.009809728948151492,0 +arc_easy,acc_norm,0.6317340067340067,0.009897286209010888,0 +boolq,acc,0.5776758409785933,0.008638883260317736,1 +cb,acc,0.375,0.06527912098338669,1 +cb,f1,0.32619912953739855,,1 +copa,acc,0.8,0.04020151261036844,0 +hellaswag,acc,0.4765982871937861,0.004984313205791442,0 +hellaswag,acc_norm,0.6382194781915953,0.00479533700911818,0 +piqa,acc,0.750272034820457,0.010099232969867486,0 +piqa,acc_norm,0.7611534276387377,0.009948120385337484,0 +rte,acc,0.5740072202166066,0.02976495674177765,0 +sciq,acc,0.925,0.00833333333333336,0 +sciq,acc_norm,0.921,0.008534156773333443,0 +storycloze_2016,acc,0.726349545697488,0.010309797094497109,0 +winogrande,acc,0.6022099447513812,0.013755743513749027,0 diff --git a/4b284b84bc4seed3/evaluation/rankeval/4b284b84bc4seed3_5.json b/4b284b84bc4seed3/evaluation/rankeval/4b284b84bc4seed3_5.json new file mode 100644 index 0000000000000000000000000000000000000000..0dabac4ef7447b4ad241164c57eed68866e72c25 --- /dev/null +++ b/4b284b84bc4seed3/evaluation/rankeval/4b284b84bc4seed3_5.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.328, + "acc_stderr": 0.014853842487270334 + }, + "anli_r2": { + "acc": 0.348, + "acc_stderr": 0.01507060460376841 + }, + "anli_r3": { + "acc": 0.34833333333333333, + "acc_stderr": 0.013759437498874072 + }, + "cb": { + "acc": 0.375, + "acc_stderr": 0.06527912098338669, + "f1": 0.32619912953739855 + }, + "copa": { + "acc": 0.8, + "acc_stderr": 0.04020151261036844 + }, + "hellaswag": { + "acc": 0.4765982871937861, + "acc_stderr": 0.004984313205791442, + "acc_norm": 0.6382194781915953, + "acc_norm_stderr": 0.00479533700911818 + }, + "rte": { + "acc": 0.5740072202166066, + "acc_stderr": 0.02976495674177765 + }, + "winogrande": { + "acc": 0.6022099447513812, + "acc_stderr": 0.013755743513749027 + }, + "storycloze_2016": { + "acc": 0.726349545697488, + "acc_stderr": 0.010309797094497109 + }, + "boolq": { + "acc": 0.5776758409785933, + "acc_stderr": 0.008638883260317736 + }, + "arc_easy": { + "acc": 0.6464646464646465, + "acc_stderr": 0.009809728948151492, + "acc_norm": 0.6317340067340067, + "acc_norm_stderr": 0.009897286209010888 + }, + "arc_challenge": { + "acc": 0.28924914675767915, + "acc_stderr": 0.013250012579393443, + "acc_norm": 0.3242320819112628, + "acc_norm_stderr": 0.013678810399518815 + }, + "sciq": { + "acc": 0.925, + "acc_stderr": 0.00833333333333336, + "acc_norm": 0.921, + "acc_norm_stderr": 0.008534156773333443 + }, + "piqa": { + "acc": 0.750272034820457, + "acc_stderr": 0.010099232969867486, + "acc_norm": 0.7611534276387377, + "acc_norm_stderr": 0.009948120385337484 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..571fdcbf6e19f26937860f44604b4e1d6871c7dc --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e96742ede50e51d12935b7b59bee68eb57e8ac8f02fac548dcfcca1fc09e6a80 +size 199058647 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d5e18039c8084d6ef71c0f515690711bd4132fc1 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3866b6735a9f4852f9d96dbd1a24cddd436dd055c945791abcc48d981e7449b7 +size 199058647 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb28e9b3899d561a53336db64874890e4a78ff88 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50c72ba9e8e8fa33162c37615ec60bfcae9b19d7c327ba0ab1fae7dee67f6b7f +size 199058733 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cba0f083b4b422755fb1ab50da48eef88e01d445 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8d2792ad1bef3ee7288fe535ec54a58aa5deccb88dedf9a9119312f247b3cb9 +size 199058733 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e0cb7a9151d8491aada7d8b5e8dd15e38206a663 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c8e264a49a255d7e04fcba3f268c7910a1442205cc074e603538976f3b926c8 +size 199058797 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7603b755fbb0aa930a6fefff39b1158730c193a1 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23c742ec91e75e2b72d2bd361e5584b98abc2ceba890e0bafe8249d5aa112221 +size 199058797 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..436b16dfb8caf32829e3f1b3b1e6d82277fbac5a --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf2f3a3f9202e75ffd5c0dcd6780e7c937370a2d6a8187819c8232c45a55ec36 +size 199058733 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c45dba5805deb396ac285bc7ba478ec7b6f88b03 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76b973cfe1f12e6b5b8083b09f15e9ff1cac9619943c82a1d61a1591a01f0651 +size 199058733 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a9445d37523fe9f6e45cfd12b65c90cf8d3f8fa3 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de3015caacdfaea928eb32119f0326e6e810c5d714c42b0f5270a11969cfd89a +size 199058733 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..63a4da6a3f1ca1291a73580ca54dbed5750a7005 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2a87bce4d5777708bbb320a3c1508d7450481d1d88aebf51f980a031460f3e7 +size 199058733 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3520559ae30f526eb913a65ca7c9e1f5094c0d8b --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cffda5f79370026482c36ab3fde7597d062560339bebb70ccd11cd8ebd2f53e5 +size 199058797 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c1125b331d142701cc3fc05326feafca469563c --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7520ee982f26227e15da7bf7c419c185f4ddd48c786367d48783325d0ae12bab +size 199058797 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b02ba824a5c984d9af122a06d8ba9e8bd75089b --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b196f007936eb6c7d9ec7b1c3e0f27a2641017c4534c7e519a12a7feb7e4db0f +size 199058733 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..12fd4ce1c744390ed40bb3b505e80fe2828c0389 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4524f842719063f1f93c32c5f1c1f51c397a31ebfc37e6d2b74c4f2c144bed57 +size 199058733 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..736ccb9938f98ab5bd0b70f16b52132723030980 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7884e2609d21ca9852e44c8bf954f51e0726c451690a020834f9548f498656eb +size 199058669 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..840e3042e330a017b6955fad57b5647bcc249812 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45c71febf4167bfca1e1abcde388aa070e4267cfc78508d13c23e98f7a3428de +size 199058669 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..568fd7c0039ced83ee8e1b630005dfe6f4582657 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c8e0e1e261648b886c2f74d3133d098b94448b9c982175ff57cc8eecdb819b0 +size 199058797 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a20e767af470b75839f036e1d5cf8dc029b83e31 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11d7a1710ebae585a6f1c6e91d3fb57ea93f74719e0076cd1583f3fde7e39613 +size 199058797 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fdc9b708678da3bb082029ff79747197c396b72b --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c57e5b0fa0602502bb671c5ddf30e593e8cf84a6f1f47b1bec6d1577b7591730 +size 199058733 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..876e48994eb0e801b78ea746e9e498cd8fb640a8 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed37df1220afd88ec59c9aede234e3bd9764bfff88684a98503301024f3290fd +size 199058733 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f24b4d8c24a93f02ee1f8626369e7900c8685e10 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:360f2b751be127c3dda9b1a060c02d900b77f3b50de3b85c6be41881b0c74dd2 +size 199058733 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd1b3e1ae294a2dcf0d02651a2317def2e08ba91 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23eac40246b032ef511b5733bd3d0d3f43140c435992e06a5b4f679c96880aa9 +size 199058733 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..05c1f370e7d79c2126cb9354761a8641952ccd64 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8f0a851466dc5bb0bf945a67ad22608cf21ff1d16a55bf7e412f98a83f51a62 +size 199058658 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5062aaf4742a97a708a8dd3f0a025a4eb3f760e9 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:144beb989d323273980862359be423ab9372464fb1797465370f2555ba1608a4 +size 199058658 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e5ff40a0ebdf373e238e97a5af3a1566b770171 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2ba03bfbf4cd8de162c497326893434f8b90799f545180a7d53fb92c43590c2 +size 199058733 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf400ee08724f0b6aff6570f6690107c3220a1af --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93963d642333760b4bfcbbbd2579531166e98e83454a682762b74bfae3680d7c +size 199058733 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba69471fa299ef7e738180467a38229e6aa2de17 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6394f62dcd2c5a120d669046d08cff7dc9f08fd22718452ba73d35714e837d7c +size 199058797 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..866d7eca8aea6b447c0bf4ba1812db7ee15ce655 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87fea36db07bc6173156dc45c62a0c4298e383cb909ce74a30960e414555345c +size 199058797 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..486a85bd9ad964f4d6f48777722ea45425bfed3b --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b235c0d695a06a8a5eaa75714c98ed0622005c79e7ff90d63e20f3b106af2d7a +size 199058605 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3c6163fbda24edcac13bb7ea4c4991fb52d58ea7 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48011dfdb9dd6f453a98bb99947f84cb0880dfa3556f9916af4d8a0e115d931f +size 199058605 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..25c3ce69c3e55991d021d761387c9aeb0cfef542 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2278d795c1c23e1c0f4fb579380d0ed7f4b22949f1f997eef5c24574424012f +size 199058669 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf43814ae4d880f6033f0340ba1321263003ea1b --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09a4e7d84ea94aa05f377c4998e4468aa0727fcfd00dada58df131413543567c +size 199058669 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a95c55718cfd87083378268eb11d650087800e20 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94be921faea37128feb8332fa208e64377afc1c418859f5c2cf7f65ccec6dc47 +size 199058797 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b9bd559f5522870200fbee74dc02e2d74c7beb7c --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5fa559ca63c7ab6f037918361fd25a353c4b255a8647a409ba11944e7412477a +size 199058797 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7574942b26d6705b0a8f19e6ebeac153224969fc --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8808185db9c7aaea90d119515f9d3b1aca5a2133cf2ff50d8b40eed2a779a121 +size 199058733 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..faabc6a9114f86acda29b8da4f29cffabbb2068f --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce4027b36b89ebffb729c9a92e7bb4327e0b4adf13f237d6ff294dd0ae3b62be +size 199058733 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce54db440128a5ccc1e1b26b5154cf7d7e23e3ba --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de008bed5551d8441662191300fd6a7286513213520d149c345aadf8b792ff14 +size 199058733 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ebc2d6f0c59812db19310e991808e551ecedecd --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a70905212d10f659d888e1c33e821af788b618516f5fbc708e0c94791e19168 +size 199058733 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..877240af45b22a704ff3d08cebe450b1dcca5158 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9e709929dc0e504afd50d48435e09ac94565c4140a6d54f6a28bc6a0a4b0f86 +size 199058733 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2415dca78df11a659cab93c635d80d826691b9b1 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e8e8286e867d0bccb98aa7407cc605fe1b68f076e9b9ef693915cc3d105a842 +size 199058733 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e63a1192ba64a024b414ae2cf4bd5b4bd7758ffb --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f6dc3a62f3a614cf18b08fa0ea39d645e3c766b24ef7e653ac71ceef05bf92b +size 199058797 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f55a061e36aa4411c4e248d08bd13df7b58c47a --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7351788724cee2faf831363635751aac154da0d3000a148273b423fdce47af13 +size 199058797 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0f94bef21f299419321a9a3703dbd2b501a4456 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4960bc6b400f505ad0024e4142eebe4b9c2d831df7ede64c6035a968a599b39 +size 199058669 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d092e3dc666c455509ba79b539bfa72a0c475d2a --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ea3fe55838cce11cb512c11063bde9c24074389e8c864cfe51118263a10235c +size 199058669 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e2eedbe1e15f58b793d6b0f687fedaf214bcaab4 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aea779fbdc19d8ca78ba3b7932b4f702509007a9de8838d91e46657cee97f40e +size 199058850 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a77c5763475f1a688517f3199758b0e682da326 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea7047256712d77be708eed7965a18a90ba2d50422079d64c5652d9614a3a2ad +size 199058850 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d2c7285f679fb63dad22ba52b9b2c3ef731c33be --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c35bdcd161ccc86cd1362826ea3e095dcb84b375813e7879179d6791da244beb +size 199058669 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1fca6257eede72a8b92db6f9d9a6ee4a4186ca2a --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:527bcc9be0116ba0e54cc86d9fa40d3540bb9d1cf9ab92706a4591ebc162be8c +size 199058669 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a27befe6d859b36db6de1baac1258e8658b2488c --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:337220d40722cc3e0c4ce0a08bc5f56cf9c43d3dfb1e75f53f9d1477218dd7fa +size 199058797 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4b2b3e09f0514f8a7c286ff9cfd8527b1f8b7cb5 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3dd99ec4302a7f345d3fcd4f1efd3ff9cb26fbf966da5ed373c73df5adb829e +size 199058797 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ebfd27032f1a7806d01271861273905a32c232c --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d32bfd691f15f78df470672a6bf34e5a9e7b6e7b4afa54a35247d1a29c0964f9 +size 199058733 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0de3757cd74616688906e1f3b67a8a6856ade075 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc943bba080f8da746562c555ff9571cb53830a087cff65a0379b9ef39e33f43 +size 199058733 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fbcdf133884aecf0c78260398c409fae3a49cba0 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a2f557f55e369d5f2286c48c5e0e21aae5ba036538c9c749f16b10728e2bd6a +size 199058733 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f2e7294bc188e563370ff4e51a62a465d33fe6f5 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0de7328619294eebbac861b5f9030d0058000b2b38fa4f2a7aa6734acb50546 +size 199058733 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf927e3a6d2027b4014ec929a43b3963f57df721 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53e1362f57e4e77015eebce478f6fe16ff04e46fa3de3344babff3472af22000 +size 199058669 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..09af1b8ac140bbc8f6e6b77be57b99b25d127062 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebd75c0b9135eb2a10dc9a9ea69cf39e24d8306cb91749e41ab2877465e5ccc2 +size 199058669 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..76a2c6f896f936abd160a2b3b7a6e61fe23da9da --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b00416991096972c973a12b71690c9aa21c3b86650e0ffb8e6e76756ba961f5 +size 199058925 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ed7fc0c12076319390fbf8635fd4d5c9888ae0f --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0bb4fc2145fd3d6815b79cfe1d3502dc8dad7fa861867cbebdcd070205464196 +size 199058925 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d0c8dff09e96b1439494e6bc262f98e9116c1c5c --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f09027b6b61cf1364913d82a2c494727d91a88e5c90bbd6eda4dbac6654387cf +size 199058605 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3feb07ed4048617771cd0d67a7a865aecfdfad1 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04fcddf92dc049f09e1f75ae01a5b375f2f34f601af3ad1dcf7ca0c5fd3c1930 +size 199058605 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f0d3f67c76be3e05289c5cf42e11a14faf3c852b --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82502fe89ec6cc8cd532a0088f0d86608ccc75a9ff6dd4860d1d27fe8832a53c +size 199058605 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b4c085ea9c8e7757a0f5730ee716ab56bb09ef1 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:123436c127b3f4a75578975d56d8cc9e74c4a0161d3cb5d359ef2c8cb61f40ae +size 199058605 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aabd3269e80991f62593f5716486aa306a4611bf --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f19a5de33b957a139bb96674f2521821210d22f2a9a2ce869970bf826033200d +size 199058722 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f365a4c9d4c3c54f590fb161cf751d7a7203c8a --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:909012364cddeedf210ab92c37e203b0ece9b8df77bf5a66858db1bb63232156 +size 199058722 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8742eda60259b268d6ae52d65e448ec4dbf0b3b6 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e81456eaa4089c3b3bca793df36a6e0be3218485e2d8cced766c65513486b83 +size 199058658 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2908e8f115f97d4a281badca9f09d22c91e3415a --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d808d886460793c5c6c537e8d6db9aebbb8ae078fe3de42814e6d14cd8babcc3 +size 199058658 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f89f56feda26668d1b6a71c67adea4423caa826 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00c34a35780f46b39c33cd18f183791698120158f5dcd862272735c2b5e17db1 +size 199058722 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad66a280f38cbedb7f45989967b96dc162ea2afb --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6073c9175bf700f65a732565048f1b8a96d9e64bee1c649b065e265b710240cd +size 199058722 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9df66d3f0043434117a8063c4b859c41c7a6eff7 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d1f546cd82e211c05df8360fddb433887f48d5877cd8ae951b1ae39a899ded8 +size 199058658 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4bfe7da56a612ed16bfbe4ad89651e01a3832c77 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9c3c1033bf96427773e9173bb877693f4e756e6680ddaa3f87571934ecb9c0c +size 199058658 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d4ee072ae4d7b25b67e36155dc32bbf80f4c1787 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ec6bc69cc1e8795a449d4dc97ae08577006597b44cc9bfc308c6642b2dea33f +size 199058786 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..beca6e4b4ac1441724939964273504eec1986aa2 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb1e4b7d097d774061f5da370046925022b1eb190f7250e3b608ad7eaca92f3b +size 199058786 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2b5a11e171d216683346a0177f3311f154230055 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d25e5cff100af4052a3bfb27fef5ee6190c8470f54c979650dd406bd05692057 +size 199058658 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5672b6fb06be4675ff4f098942bd350faad326d0 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f24818abc2a77e9ef620178891c21347f761099e5a93ff4f42fbd3af35ccc7e7 +size 199058658 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..960bbe8089be816dd0d66d2c785074d40a73ad70 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27e6b42fa6a3d6ef8aa3ce5fc71c7167261b75fb4c61163d1605c714d3db3808 +size 199058978 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b9527d5a3f06cf97bf3f0c6202080d2e408f4458 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:710360ccec2e5adeb4b95e448af848b7a0bbcc59b8ae0e8e7aa16c6b9170f862 +size 199058978 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..68c270e8eaa93e67e1fcd549196a1dbe13dc2a3c --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b72bb6fa07abe33a435ac8a0e015d94e5c337fa1171913d0dec9842fd44260a2 +size 199058658 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..683dac57009050b7afbdd70f0df32cda5a0065bf --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2238dc7769bac982ac535c5360784d370d54f547942d59a04cd4df39df7b8b72 +size 199058658 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..95ab1fb50ab3c5d6ab9acd8730f63cf468551e3e --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c4ae74c5f68d53a2ac5d26c9837a480ad7bf1119d442fbc1961917f7d8924f1 +size 199058647 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1faf326e0b2a5c5a1bba71fef8c453cc99d19c8a --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:712ecc72324f3143a0c167b64bc62ae901c1794bbaa6c5b9d754b2e42c6eac18 +size 199058647 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..51ca96296a3787cafc237c998dcab25e2467902a --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef4a661294391831bdd592d7aa805ac221cd357f4804258385f9767c11938a90 +size 199058658 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..47b3aa8a3af66bb80ab421fc9b14cd286ceff415 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39b046783a37b01648953076011578d54025a54824dbd8f68ba2c018c3a0934e +size 199058658 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b524475ef31f6bff997d6e22391010ef2ef682e --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ae403fb2fa579c7b4c4cf35855ab98803bfff7b3217906e51c7e9a144413ec4 +size 199058722 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f99e18073b52a98f5a10975b040890d3fcd78d57 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a939bd07d240803529dbccd4d6b23f642883c32714906425cf32ebded678e195 +size 199058722 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f200a2da030579919d5fdbc84b93c987dc1f65e --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:231d2da2f8b1e91bb6859895a8173e72e95411451c43094718854969489a726d +size 199058658 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..95dfdaa5101955f21200f850a0660c025ca1ba49 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6757c299b890e005612363ad6abfddb8cb975e57df3e73a3670b12c7da03334 +size 199058658 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf84a89fb1ec0ce7d111c74c83c149aff0095ddb --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e6e9f6a4607108962b8e56f49acaf25112991f6ed8d62eff1a30d543990e97c +size 199058786 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..db5d49052e65227a6d56a6083e907402c796dc8e --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc68a01e7c66c9885c2d1115032214076c93577f5570c13bda4cab4e5bae4d50 +size 199058786 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..459fbedc236132153e719648a4cbc8efdeb4fe8e --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2934dbafdbe502336147f9c9a11d75cd2050bfbb68ec74b66e453c95492134d9 +size 199058722 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec1a55185df8181655d388fd5275e0e93ca3c4f6 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dca7dbba5b2c3db8b0ace12bc4fe35804553cb29ae2f723b9b91daf9e641163d +size 199058722 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3eca30b3fe36dac26b0f65791614e69bd98bb317 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:131a82d56facb05a0318a8f3e2fb28e3ce170fea4810a57f96d330e34b614b7b +size 199058850 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4eff9a792ac900b386a570c9a9afc276fbb53533 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a897d12db58a84fa1e23643de3b09fb82c778b80242defda4e77cd73be65cc2 +size 199058850 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6bba81ce2725d7840a3cc86e137854ff4f91c466 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a055dcfa3efe4e8ed0623682927344b16af023fc553dd05a397f3b91abaf9acf +size 199058722 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea3527f0d9d78545699058d11d87314d9ab9c480 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23058e699ec02f33b49e77408aaee63191a42b3e977a14f0b00870bcb74ff24d +size 199058722 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..025d6205d5ea28c824feab6c0078f2624cc670fc --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8054f2e705728af71fc07ec03f9d9098c3421ab19089ae25bc82570c24fa76d9 +size 199058722 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4105a86f4ef257c99c84f76128fae96e0eca16be --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73ecefb38d5d3e60b445b2269c86698c3625ffd6fc43ff53429ecd24150ead48 +size 199058722 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d7daf3188676dcd3963d972470302ff6b22f888 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d83a8b1395664e1724662568840b0723c43cc76acc3e10477118dd574334a210 +size 199058594 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0e36d69a9678a901f76e71bd55785371127c4e73 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28f27e9d384861952efa1b33a8d7415f72de15b97684e866d6b4b547d7c5d83a +size 199058594 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a32e2e7ae40abdef76c9260324e2806d0675aca --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b829106bd4b2755b740d308526be11a1f13ab13fee1229f82a5e89a50cd46e86 +size 199058786 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..34c0bd41ebcad606a3244360fb3ae64619450fdd --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:434211d76056ea2ada24a8e7bb14d0f509bd467c2b8076362b2a4738c8d44a06 +size 199058786 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6e469fb773594ae46bb27d7f80047e360b4e2c5f --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10b8cea238e2e41a394ea3e1f50c34ff2021518b0e177cc5d2b60c4bf7deff72 +size 199058711 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..16719390f0da288a1fe2915542461eb84f60be96 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df66c4ea82ea3637aaa547498dafb5970655c4b8be204cd3e8664902fa3f9d68 +size 199058711 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b49c6df862e1bdbae45b1a12c45daff2c0ba4138 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ac14925c7f7780f01c18adce6ac95089a0738391a898dbb4debf7442b359156 +size 199058722 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f761433acaa191d02af2f6110133f7433eb74009 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb5831eedd868c50823951cf1faf90d61398221332a5e16b43ef3155cdc70a19 +size 199058722 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..302c4b13dd27cceb0ae8b1eac46af7d6e11f7234 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23c16487a0ce6aa407b54f8d85a21a67dc0700130ef01c26682909eab4b720d0 +size 199058722 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..257b08a919033a6799008c557bf8dae3d64b0fdc --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27b4d67f6868fcc386d347078cd9b0feeaefb977a0d8df2fd5045b7b03455599 +size 199058722 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb5da6b25b8cc0e354bd120f2c1205efa200670d --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:265688d0a1ba5606a36dfef48b65386fa895a6cb86535b03c7a7a05d0f7eceba +size 199058722 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..966cd30f1c6a9c00227e35716eefe8f6be0f197c --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31771eeb2a83cb182eb0aa738dab5538f10372303ca226d37fde69a69e883a9d +size 199058722 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f835bbbb548137cde21dbbe354310de139a8f48 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bef4988b312d0d750e0079d1008ef5750d5f3454da19af7e18977a88568e9e08 +size 199058722 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..257e0c161c2fb155f62773084da78d42f5de44ed --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67f706a17478502537a4e391f02118393be87d4a7467fa4761be8f0fcef6bb4c +size 199058722 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a31db4f1f7e6eded6476031ea39259a42a089c71 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0dc1e8963923a780ba69cd134b1937624e817b98a4d38072cc9e4a048fc59756 +size 199058722 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab911f54cb83b6905dc675a99c2f3bcbbe7d65ef --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46926b1ebfedc76952f7443d11633a6eaf22bcf2d490784b924f98cbe3484bda +size 199058722 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..259b2c707d4d21186fe819593ad23f278e0d5c05 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a4d590a5a6d90bd0b38eb26e3870b3166cefb7de48292b3304ce362b4ab7463 +size 199058594 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..037b6dec65d58a4d8268627940c3bfc7c8ae2a04 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c4fe24053651b8ef29d826eb32455fe05bef58509dc0c06b66202bfc3c3ad93 +size 199058594 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b1b320ce06580553eb9554f13bf30a2561ae6ff7 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c532658e997c82465526fe195df3396a9be551998352c41693d4d013ecb3796 +size 199058722 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d85d04e534283a1d9612ba683bf46624013c723b --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d84d9a5ffb92b1e63d2af4a26d8ba80c73dc640663e7a4e140aba5b79f8f4264 +size 199058722 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b260422e1409a4869b0c760b4051eab0ee37dfa2 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c36e01e5ba77506d99cf00cdd4d0aa9e433c1acf1851174822ea05c9fb458f8a +size 199058786 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9180691fa7099c76b594c87390dbb2c893529453 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bef4a5dd2cba1980ccbe8b72112d400a020f4af4342e83cab24a59db368f7c1f +size 199058786 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b7415898be6035ff69b4133ff15023bb98d1ee82 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a5658a77ba4db1ba259bb57e70a46cedb5c38ee9749b4bc0c8f627bff32e96f +size 199058850 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..22f235916aca042f6d764d90600decdfcc92853b --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b92186ef23ec8a07216830b339919f9cebf95e457deaf3428a96093cde7f4ea +size 199058850 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..07b442b1dc18b9e39f8d81ec00cc7e48992ca399 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c364b8810483e67dea0e858f3c3ceb8d3758019133b4d6c0854d8fd2a28f70f +size 199058658 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0402961810f67a6c7ab51d399492b7272b2ea190 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c24dd2a805c57f0ed5e84c6174381d18f2be2fc262266045f7e481a7aada8cb9 +size 199058658 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8de621498ce4b5313baefdead653fe2e1d9f7870 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a5f815a343557856c9c2dfb43bd8f71a262809f6de42a604010bba75bd49565 +size 199058647 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..14177bf3889c940727aba6f06e4089bea3dfca23 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:515d2e38e1d6bd6520fe2f6ed529a73297b6bff86a4bc7a9846030c7b22eaaf9 +size 199058647 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f2e7601db4d0457054801cfb863c88fa0dcfc2ed --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aff6b05b12af0c8825024ef9b753ae3ff307225a63c1e00f09ad83f15f1ac118 +size 199058722 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3dc18118bceb40d7481a837a63737bf166467f6a --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:edfd532d66ac9243cd5a22ba041c8ec95ca1aa6e97c9bf05c6b3686750b75c39 +size 199058722 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..17af509d239b80d89edfcd4849dc0f04ec8b9525 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd687d868e6582ef2230ecfa3d77583ccd290a44f9aaa61ea02234e3361de932 +size 199058658 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f922bdb4f366d0abf063fbc3ce92874b5a6ff9c1 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f06d596aac92cdfcf6e18a97fd23843605bb512dc596c44ce20db9814283495 +size 199058658 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d84821ea849735c34c89c1f5afaa83ae9af885cb --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:accc6d542ad7f678665e9acd60942489904b3c9902836883f756828c68a2d30f +size 199058658 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d0e0bb34ba77227d09b8bfa46118f718f5bf0a9a --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ad066f26523591c2c788bd13b17997c8ba72474cedb49c34cce6d55d14bae87 +size 199058658 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..af7b692902dd76c1af7d72434a8e2ae01a7987d3 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d02139bd50b2e4081e8e172d816c4d02c7351192cc4ff61514f66ffc0970556f +size 199058722 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4b020911135cd7894cd5cd84f1717ab9103a953b --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:afb77e2523b50bec1c9b96a8591b8cf737d944d4afcd9dea3fd4ff5ba96a6e1a +size 199058722 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c11ac5a2242f0409ea3e4ce7a6e7d8791ed0418 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:650f4bf96d4cc62e98ef35649c731a0f1d437d37a2d39cb229effa94c303799e +size 199058850 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba462c07b64d7681b89069dcaa659c382a2222c5 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63f3a0f75ff5c1e75b63ecb0bd2bd47f52fe492bbab278a3bd177d0961be9678 +size 199058850 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c44daa86c9cdc652523e0c4cc22c4af4b0eaa844 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2176c2388b3e5917cbfe6ceb9a51ff8bac78024fd837fd111bd0ac7e39be2f22 +size 199058722 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc70c2534a4e65960e0ab051c565763e4f885140 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8675b98cdc00c6bc654a3384fb373f29659ebe5b5216dffde0459d7dd96bb949 +size 199058722 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b24eed8478949bd3b15a0c436573aa396e0b4b8d --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73fee97e3d2eccc8ab5f7cbae43b562998feb26a72a4d21281a1020458bfa6f1 +size 199058658 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f12099b4a201c32959c3503569f682547414afc --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:afa8bcf368729546de9b045255b058370d2eaf656e913a942f55a3802802deb6 +size 199058658 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b1103dbe58e37bf86e00cc03050e58ae20c3b7c6 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49556c5136a47cca2f831cd5f70ba184f80aab337637175b9b7c2b751ca56110 +size 199058722 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8325d5858ad782c0d5f7f88387ff16c8b83c3deb --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dce00a61c89c4e5d7a3f7b9d6884cd36c23d6bfb0b22243c825d48ddab91456a +size 199058722 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f8b635a9011cedd25514db102d55be828ad1965 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d02df839bc88eb5e2ad8193ebf4107bca66b3d7dbf07a87a19479b875abe07bd +size 199058658 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f928e4d1e867ca14e69e98ca8915964ac13272cf --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a2ac84b5fb23bd1008c260c33075c47d8a0d654642e571b294e19d5c27b45eb +size 199058658 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b73f3894694371e1c8a1ae45c83e9db8c3ce9b0e --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1cfa805c2ea1f7cdd04623dd4e98d2393e185f120d18a802406b828c84152c5e +size 199058658 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2726b4283bee3703c9b380afab33940843269f1b --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8244cdec6dedf8029bd137908a6b5f73eb28f9a70b21b3ecf98afd5c9aec0fe3 +size 199058658 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..402dae0b79fbc787ec5540a335a30e1b47118335 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55322f260ef1137e206dfd3720543c398684dcc6995b3c5df73ebdd169d3db65 +size 199058775 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b3cb72e1b05aaaeef200305a149506eac9bdd419 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8982c331b25129db87b2af59b6239aa1aea3447cf8796ae5fe37ab0c3fa7c9bd +size 199058775 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a0d9730ead4f7257d82dedff527d725b70fb2690 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:79e0ce6ddae2a8a1a447398b0c1cb332b952e3bbc73d655c879c876bc8a237c5 +size 199058722 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..16abac71fb85f6d9d37f5de44adcb3287a60cebc --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:941598835f395811627c64c3f1ac8a5c26ebe20662d4f5ae39021870ff73a579 +size 199058722 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..734caa14640aafba098fbb08dfaec3aaaa95d8c6 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b7aa8c2f06c925d104ef6291649ef95dbc979087fef69612542f5023b86d138 +size 199058850 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..55a56190c4efe2da38a9a870cf58582bc2d64a8b --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b047579fdaa3d5a989fb98eee90134fce20b83462db0b6bedb39f43e1196b40 +size 199058850 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4b95f809b16edb3ca945f7cdc87c800813c04f0b --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ffc58b2d4c7fea49d4ef06a2a0daaa7160f1c3f86a72418c997701cb42e530b +size 199058722 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f4917b2dc5f99c2adc302c4f8c429bb61958ca5b --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d65a866a1ee56f1b157868a745a9a8409234fabb439b74e534802d2b041bef52 +size 199058722 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d80a9f7a445c14a6816b99c22dcab66b90e7398 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8bd01c3d70570a9c98148365a4ddadcc06b77567103755315c18830491d10fbb +size 199058722 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ccbbe5ea2ea64394947280f62ea16bfb27a99285 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c50b4a775507fe19d89465f2c73c59bd113f30e17867f9bb36a38b35a34f5a9a +size 199058722 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ed02a2bc0ac38c90617846ccdcfa88d4acc71d9 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b26bb4bb0be9aa06da43512d80ec5d657aa967d81710142bbf140bc038a8a28 +size 199058722 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a255d695233faf2e44855074d77d0ff2b888f1d --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c810ea0b55a014133e54c456a5ae88a1f638880015c918de8aa4856ecc14a2f6 +size 199058722 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5583b52acf0e7664805b94063bac49d7f37b452b --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0695a9538cdd10807865f4c248c2672741fbc3d4115b89aa232a78f06de5c563 +size 199058658 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4b05e0d5f039af5e3113789842bb5f05ddd06ab5 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12ea0e01914ddabdee234d2a821ddf65eb6b25d832827d404bd0706e0e13a9e5 +size 199058658 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..64b2da25cad985ee0b74439d1b900f70cef37931 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f184c44f58efba4b4f8aad768d0068983c280a788ea34e324172bdc5553074d3 +size 199058722 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..46ce5d6e78a20482b8098132c95e968bd943bbce --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9f1a1f9a3b6299059820b23a77ff944d839f2b6e4f18adaf3da0f2a2b1cfab7 +size 199058722 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1520f578131885e38f25d53f759bf55aed59217b --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:058e908714bb1bdea8d4c237fa0b034b57df6b11fcf871cfb2542f630302d483 +size 199058658 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2182dc01c4635da31e31b72cfea8d291326e7e3a --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cea055f080fcf3c421b78cf5f171558a223c2aadd84b47bb26ce23d80782fbfb +size 199058658 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..180a3b37375cf5fbd29986e2105d4217fe05bb05 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:786f4ee016a534cc1ebf2fbe531a5b4863fb119b67e3a8b345db6ec069302776 +size 199058914 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..09551653b52bc03688e4c8605c55725aa7a54675 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d0a3b0e3d6b66e558f07d9216ec83eec69f4999acd1ba5ff0b5236433e29b2c +size 199058914 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aacd2bf976ed0cff520d9a15fe694290bd3c2591 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4623e0ce4ea6e6336b0f3d34528638a1fb94121cc62ea7850f23d3939b57206b +size 199058658 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a0fdd25705ca1cc8dcfa31750d92b0e3200d6078 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:469409680613c7c63aad270d1f99a12f7c50d0c7dc07a9a15d508742b6fb1187 +size 199058658 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..54f279a9bc6904602325c9effa96b613740dfdea --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab716c96a5d03565e9da3888bc8aee2fded177ecae75a48e4b48839f37f081f3 +size 199058711 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb72deec0fce0dec03a4817c417fdf1481964bf6 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24bf1ac89999b8fcb75b30a01d8f64538c1cec607e2f3e2ab15d6a58000cecd7 +size 199058711 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..59da7f5ad115f892a995d2d764cf810e607706ee --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:205a1dca980411805546b3b63357f7940ea522f7b102655c73de66fd10607733 +size 199058722 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a370feb9a3a316ba1e3aae26389061148b314db3 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29c8bf77c487a155f899769b74e012c218897a58e7228380076720e46019654d +size 199058722 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..26b1b638351498c82c2f16a05541023e91b3d324 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10791885bf7b7c4e76d6ae83d3aab424711b138e658046b7e8b314fd5bb80017 +size 199058722 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..47ae04ccf4f9599add8f1003a27dd96eed439915 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a55f1164acde69365519a75a605eaea25db2ea650726568bdb55f526aa6365c +size 199058722 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c24055284077976780e62928960071030b6b798c --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eff3d7fd32b9e4f2fc0d92ce8374a859b5b2c3f2da497dd81c9e2109a41238ee +size 199058722 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e23356c8008e6353e5223f58def3d88e90ec8e50 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c38a354421c1761d7616abfa15533b637715065781ab3d735366716b9347bed +size 199058722 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3c66cc0d37985eb4338c6b402880d07a1f2fd858 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:701a1b83e8e7ab169eca8d421d38c635b1e446ce32a651cb879d1835a7672e5b +size 199058658 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d38bd48fbdeacf75cc97b5e44cd774cae96042d --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c755e3a410030bfbfcd09e369e241748688e4f2ae6d417db7307b8cfbe9c07cb +size 199058658 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..668d949f4b1f8f6da8beba54c48d2a8b68194f38 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f60192ee58c4974dbeaa40802733d14c7d3ce3180218d1ff896d0e24449273fb +size 199058658 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..96fddc5533d11582aa96b508ca1e5f762a9595ae --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed6360db22de503ebd0d29bbf549309fbfcbdc82f568f63dcbb7314373cc948a +size 199058658 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..696d3cc2fae4071122ce8eb531b2f937f0d83b04 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10ef54e8115378b2f78546271b5a3b4bc291d5b6b4290cdf82211d7c60c71362 +size 199058850 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f56c423a4691d52f91d7d84bf6892c0b3f5a8610 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c3dfa03d171c8d57ba1af94fecf210df87de08f08c67bc7d7c3148f48b65c86 +size 199058850 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..81e896a53769ea7b4f9d830b157000a0c0cd6065 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8fada506a32c5adf2c0b56e608c8bebbb0d9bfab428d864c481437bd2bb623c +size 199058722 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd268aa295db56a84906000fab7ea17e556da165 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:713370979524344a7e4460cf16fdb757a3f613ec3d38409c777f3c0bd54a72c3 +size 199058722 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..471abe7dbd08ba907e28512baf5b298bf61ab227 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6c7d2dd2c44c0a88e7aeac35e45b0c4996e7a4dd3385e59e64903642c567492 +size 199058786 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d0151e469a783e235a2a0b4be54e3bfa6e75083 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:390e0528358b6dfa8faaf33a9a3395bd42437d95fdb5378bda0df64f3cc1754a +size 199058786 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..998e15798de54de3aa52297ca4f21df14118714e --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8bf15c9fbcbfa3515901bbe5efca3dc646a069ff09f1b8d8613892b9c6a9c4ad +size 199058658 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c0e459ab7aa23480d1fe8e30e9fdd27ce225208 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ffcfec2ae619a4897c6c6243a239fd8a1590e2625fca2b0e0730b66434cbf94 +size 199058658 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f61da429a896279cb0764df939fdc93fa5e1b34 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4344bb5a60b15cef0343c8e1802bc7157243cc6c103cdde2ba7363f25c3ffc25 +size 199058722 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3c71e28a85b82bb6fea580a70a0496850b0b764d --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86d2f5c62eb69f79af0932621755294e6dcf8a4a5b05409beae832044b384ebf +size 199058722 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..553a3b9c326003728a300d6b879b23a9dd040391 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd301daa228ca45a38034066cd82334b1c53989f4b4a1990adb13d71c8abfb9c +size 199058647 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a6b7f990819ee855c5c1d9c2d5352405a2b6fb9 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a1bced4ab0f4faa4fba3f53cbe6481cc3420464e4045aba89b322ba26d65ae7 +size 199058647 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3846acbf6570d4d16d5c128785ebd9f8abc3f0ec --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87323425c21e005fa8b888f0dd8235babbef7f441b415073563cc9a194cfe1c5 +size 199058658 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..254c13c9aa66cca6fbe577cb7bc478708a9c6d57 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:764b8e979c830bba291dce573d4abbc11545740c499de3f8df2e91ce335248b5 +size 199058658 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e9d3838974bd61152859e21645e36b02a5383c4 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3edb2b8c1d1eb1229c6f645c146d71b6403427b5ddb8a6278aafeac5c3a6bd90 +size 199058722 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b6c1d0ec696a59b6e7f2f063d9344e14e2fdd298 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:430d70758bee014759b5855945765d89964517e89f031f717365690ce934cb84 +size 199058722 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2488bda7a0be408b4a8f08f279b97396f6c87cae --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92839b506ac1af297d7f4981a01d59dd6c54479af4b3f848bb71004f0bf0b799 +size 199058786 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b5e7cfa167e949288bf2da8e6be3583adca1cd91 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7bba38f43b91da6732d0916edb8286310e746087b956a0df2a49ba6b098d61ff +size 199058786 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e27264245ae6e11d2529ab49ffbeeba91fc0233c --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57aa3b402004b5625e69b68e48a6076e44cbb26a93006668978437226e14c365 +size 199058722 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bb5d478985c8dd2700164e6772bf140bbd89b88f --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9aa2ce7ecb0db346f1e90e1906e262f5c707d0177f74249b92fd04d33aa48020 +size 199058722 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d0f3fb5e8b1182c7f37f295dcd96f687461eb3fe --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:428ed72cb765c81820123a782d8e06e7c330ce22dd29a3f5bdaf6d118904a846 +size 199058786 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a1525f0111517da65d31dbf75dcba2c7dd13feb --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3675ea6112d98604ec1bb3d62ef05464871ac03aaa0378bb809d6e09b82ea33 +size 199058786 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a8e0de2fad04bb934894bebf926a3f1b1761673 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72fec32a69349a9d6d6d6a8f11915342c5a5a22a8a7245c9ed8cc4b204c86342 +size 199058658 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc6c82f5d886a4e92047c75915b1a26b2d1f8316 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3c059cf88ec8e3d133cf605a92056befb8dcbad5df341a5ee2568b07db30b71 +size 199058658 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2483356c301cc3ba1dfb7bfcc396a06ebf76e7a7 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf40ab9c86e21a0961f7846d0ad368016df6ec4a819db23f45f8dbfd201fb5d4 +size 199058786 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b9e2ff0ce4b348b924dc96c5b751ce43d459e664 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9bd888d74896a353f3050253e703223829790bb9a5c2293d90a8ba91934a0d0 +size 199058786 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf0791217999a3b0bc7d13232cfd29b0a8456a2f --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0dd64caf4d268a6c8e4f0b2a844131394ccb53905527128665fe1c334486a5b9 +size 199058658 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f6b846ba9ed92be4783e154acdf3d4450a6c052 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f60ae1519754f426cbdd812a81c9cd2a7bcdd66bfa6c2e532c7e616f1e5e1ead +size 199058658 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..80551dd4af68b6b1d07c440cdb4c2a89a249f389 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af08c8f11a051ce1823939ee6e85f67cada718adfb321e23f99af762e8b5d40d +size 199058786 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d38644d99b1348447f21a6dfee3f6737608d7d9 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93b17e0a627f4ecbd50a66252773a9dfdc50e716c9b5d5caf9e95a92ab883c3a +size 199058786 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a57bc6aa02cd12563a45820171f741685b42cadd --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9c0e676ed5c7faf54338c95f19ea62ac9342c0c97a41d5430f5af31e00d96bd +size 199058786 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..34011855c44b8e9940b0df07f22c1230ef4abcd5 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a2f596ba0b1f216f08e614a12c5ecbe0ace2a9e56ac44751518358db7bf6be1 +size 199058786 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f7122cbe2d3eb707abe0a7ed10f11eecca71e59 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b600dd9ca22f5e42e0183a4ceb6328eec69d21c9ecaef9e700b9194857ad9ec +size 199058647 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d5686ec0faf277849fb025baafe2fbae64da0e2a --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f2aa875fbba2a8cbcf9a27883b2e0d7e50ceb26ff7636eeb4488305ce1a8bc1 +size 199058647 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b59518fb2e8f9f56cede922fa8d5e45756ae9ce6 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:969805ee82746c8c330db1ef9b82955b3ac6871c6242a4332801205ece3ef8bb +size 199058722 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8190ee64917f887569ebce248140353ac432ffd7 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d49f4d252fc560868eb55af5458954935c8b9421e999d0fac97e08394a107f00 +size 199058722 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9311d2a5e0b05a599edc36a6e6736f97a92d80b7 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8208144385b0bcc314b01b52457bf3f8dedce35e9e9535f5fb140d6a3687927 +size 199058722 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8d7a620b88738d2dc95438c855304eb18578aa24 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:acb2317f7c699058d4bd3c1f433d4c5114096b75bea30b940ddabd2c29bf785e +size 199058722 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..341101bb36dd6a1cbe0e1f8c3e94cc1eeb021da9 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d8b3b39be971050b4776ef0ea6f8202d3e233f29f18d06a238187e6c7acc1c1 +size 199058658 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..82cc9a4502519aa8fb6e0e23a55dd9a79abfef32 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f72900d6778daf4b28d6495d6db6eecfff997b208bd3668b55e0b6a0fe77825 +size 199058658 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6376b834f31f9af3b8f8ac09ebb8cb6df5704513 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d407992f5b623c6bcdf382b0fc54432aa5524e734e1280369c60d98a70795fa +size 199058786 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e6aa30d97234264cf78fed89c71acd03f222f47 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb7f7f1220addd45e369a67ed4cd9690b4b6b38acc4f9e4e9aab8f6d0c7ac2be +size 199058786 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec9f9ee9fc3f77c0f11df84e5ea926dfce6d4c45 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76a53fbabaf396a0285cfd4c0582779b054b785d381b5a828d9d3365bc49be00 +size 199058658 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fad1fe55084ec321b1b7ce916a8a2e2ff2295b02 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26295b252667f3a906ab403a49b40e4251b9770d2ed58a38d290b93e9459fae5 +size 199058658 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4b898dcb21ad03d24757ad889faa1c08b630127f --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4cb8f68c03bf2fdb1c83f3086da0f9f0f501be3792c053a329fa4b3e092e9960 +size 199058786 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea0319141bf833c2e2bc4db1f5bb994057aa7333 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b744dce39d7cd625d0fbb3c8fff9809c3555f3f25dea14916c091642755ef8e8 +size 199058786 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c23ab4ca59f12dd48a786b0cf62c134bd6342ca7 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b187522207eed96fea68b775e5b969d18128a0ad1266f06345f11c2d49cfa7a7 +size 199058786 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc96adfe81441e4635d6370865d6a9fbe0db285e --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6da76c839f00476f48d7b29243f583ee95e3cd4d78dbd1d80d2a1f4e42787bff +size 199058786 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c5f905556dde8c671d28cb3bc96372a9180cafbb --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c5a8a7ff3f0a5839814fe0440acb67ac5d20f5575f6107c06e6c43accb2c46e +size 199058722 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..58065734fc2d187656c9705bc54b4e0ce99f94ae --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7cc1386a04052a97bc12f1afa0354e07a600e5d5b6b1bccdc1d69a75921d19ae +size 199058722 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a460018729ff2713f0181c4e9ff474f1d1a9f556 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:248c9c10abac18b13b8c023d8162bdcf0b4924d0e9dd35e9f418e8d2ef6cd883 +size 199058658 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eba2e6ac7e58d32859799344099e4c11aa3785ce --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b498f5f523a846deaccc43e0f4032d8ad7b53fffe92334f0daf6520c3adf633c +size 199058658 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..beadc2bda3afb558bbb635b48ac302fa35a158b4 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f29d060bfdc06263c026a73f8fa6c924be7de0dcfdda12bf9ed4d70d60f308c3 +size 199058658 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae56be1dbbb861f135107d8e7f98869b7ed1860f --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d43d35ecd855c3968cea535a6ec0ea5ca3c93a15cbe31c264799eeda8f76a8f +size 199058658 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2fd731491f7c41a969bfcc862b07769c7033f5fc --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b37fd210c5747f0a72276c585d882c07473012da7664c886f9d5ebedfc28a0ef +size 199058647 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3400e838b1b37298b43ebeef2980e2098d54d6fa --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:319b8ad6efbe3e3c419790ba52edef5b5526d343cccaa1ef3c423798d6a9ea72 +size 199058647 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e6bc74940576ee6e7ad71f3fc8de316c33d6d71d --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee1804e50521abac9ebc9bb7c8514b744a81389d17be760cf45883701572bcfe +size 199058850 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3bcc401b5277260af2ba96d3646515fedcba058b --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d979d7fd15ed5fbe98c84fc3c9faf5ee4a704f647931ee0126132cf1e88e3006 +size 199058850 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..997a66fa6dcf4990c8b2a5c38771612b0d5cfe01 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b17aa5d10a96742beccae7eec6cd2c3f78bf5d1a1d777513ae3ca6e305e5fcdc +size 199058722 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..276e28e97648738b9ceed2dca6c91bd340cac1e3 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:caf49d5e823a6103498151682f553d035a73378a0e7eb73246a5b4653fd3449e +size 199058722 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..636a0f1dd6fda40e316052b9710317bd8c072f4c --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8719a703a6d51f06ebe667b04af947391b21464bf42f19a7dff00ace98a6a997 +size 199058658 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d37fe161e17a9b92dcefea6668eb8fab337bece3 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9843977291908b4c85402f73be7078b652fec55135b07857dbccc9e8a603fe1a +size 199058658 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a3c8b347ba86195cd84b40fede2a0d9e391d5c27 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9dab81402c25e152e224657699d8a1f5484f52ceba2c3fc2774aa81087f8ff0 +size 199058786 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c8100bb2f1f5d0958ffb2a08a6c0a9ebe572e8c --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:040840e7d9915251c0f15ac5b9ef8429b9dc6a785c673d656afed82e3e20905e +size 199058786 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8d2efc811b4e2da476bc8c50c36ca02bf95222f4 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28c36c9791091111b5a3a6bef652944565eb91e1412b96815e94e1aa652339ed +size 199058722 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a8b21255e6805e6396103bd2456fc0df4866b93 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d166256453658dc8c484524f0afec76cac8fe2b21aa804422757b334c1391fcb +size 199058722 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0d3f06493404c3b950a2490b3e36e3c3574573eb --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf70a43c06689c69d292818918c305c6b9e30934b5af7ed8db609fc3f6cc31a6 +size 199058722 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d809cbc8baaadc4b2cc11e43e23fe6deb60893b --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c034512fa85c5932e7472656dc281088358eb977885e6e702152043316e71f6 +size 199058722 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f5dd9b144cfb8c1ca3b0a56b0be3f3f8865f60fb --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0dbf4ac092ffdc4156e15d44e04e9eb5fcc873c4166cf222ba4913434f6bf101 +size 199058722 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bb630af5d486382d83f2bc5ab165116a7307d91f --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05f0650b6754462cf7de1e3c5353b28b25b434c3a5a4ef71d7799193870632b3 +size 199058722 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7512274c065abee2b00a89794cf12c141a8a2dda --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70a41f522ccb2207a21bcba301d0f8f9348b5d069877327e5e8a7813669ffa6c +size 199058786 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bdb4f637d8460b3b4d0a59ce4ebe3c6f6c803f48 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2386413afbabfd83230c6f4d530b24376aa29b043cb0febcd14ca970687ecc5 +size 199058786 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0eda31116f2bae2e3f6f629ec3bbc54dd92e3a64 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:768a73ca8d2cce015963278444cfc131e005743d8b623af0b1f2b42e71fea0c2 +size 199058658 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1cf47e4de457e7aa859af845e331554c2055e0b1 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7671a279b1ed061f43215f36c8b55effd45e1eb38295dc9699486cf3470f88c3 +size 199058658 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e2efbf191f1a38d2698c08811e72af58b52789f --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6f99542072ce54414ff94d0c1bf763c331c5f59212cdc58482d6758e4cf4fa4 +size 199058658 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9ab64bcf5effc0e75e4f046eee567655b1fdb076 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a983c383283a52e6a5d87696a371032ef08b6848fc99a0a473799fbc9b86e9cd +size 199058658 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b8c8fa571126c4f075def43699ba7a337c75673d --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19c4ef00f3fa343f022f58d93f8bd14381b16a4d0d4258aee8b59380ba7629d0 +size 199058839 diff --git a/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d19e0a214c954f0e1f35714557d7f6af4c8d1b3a --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:067aa83164a5c5a1d88abf2cfafe68217a40fd85db4592b9fd02b399394ed43d +size 199058839 diff --git a/4b284b84bc4seed3/global_step80108/layer_01-model_00-model_states.pt b/4b284b84bc4seed3/global_step80108/layer_01-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..65977e2adb356d589d125a31488ab2c943995275 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/layer_01-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1ca53641f0a0cc36a00fd1f8c59e0a45c48464a23ffa3e518fdf6c1b23ffbb2 +size 167511299 diff --git a/4b284b84bc4seed3/global_step80108/layer_01-model_01-model_states.pt b/4b284b84bc4seed3/global_step80108/layer_01-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a3a15fb30815a351b3d0707fd788452fb836c1a6 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/layer_01-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bcd50a01bd352b4caecf1a33848150a02b95ffed5a36e52def7ab8c0e980d072 +size 167511299 diff --git a/4b284b84bc4seed3/global_step80108/layer_03-model_00-model_states.pt b/4b284b84bc4seed3/global_step80108/layer_03-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef831cfddfd373788f80aebe279031f2d0e92b27 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/layer_03-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd1724b355eb280a3fb5b0a2d09e06ba0ce0bec8c11b6f4bc6998a3c3c67f106 +size 113308931 diff --git a/4b284b84bc4seed3/global_step80108/layer_03-model_01-model_states.pt b/4b284b84bc4seed3/global_step80108/layer_03-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..32a65cb1684822b5cd4a73bd1577445c4d54ee94 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/layer_03-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d219b42036dd17d5663ed2ebe34c977938f7fb8d21c9b2ad85b8675d408aec3 +size 113308931 diff --git a/4b284b84bc4seed3/global_step80108/layer_04-model_00-model_states.pt b/4b284b84bc4seed3/global_step80108/layer_04-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2502834acdcf8fd5c5eb898cc8b508ce381c88f8 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/layer_04-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66cc69027510387f518607b439be72cc5b1850240a9a79d32c5be95f6f969d77 +size 113308931 diff --git a/4b284b84bc4seed3/global_step80108/layer_04-model_01-model_states.pt b/4b284b84bc4seed3/global_step80108/layer_04-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..444050502f4a69787477e9d00900846807d48974 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/layer_04-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0eadc31513daee6072b053236398405e539991c0ac8f4acaf4990fa57725ba8f +size 113308931 diff --git a/4b284b84bc4seed3/global_step80108/layer_05-model_00-model_states.pt b/4b284b84bc4seed3/global_step80108/layer_05-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..849da03b238eca40e6a919fc724ca0114f4d87c0 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/layer_05-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9da27fa11e012da12847bf0d048e140a84440ba7d2f8586649e316ac9fca03e5 +size 113308931 diff --git a/4b284b84bc4seed3/global_step80108/layer_05-model_01-model_states.pt b/4b284b84bc4seed3/global_step80108/layer_05-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..91172c2b34dce524b7a4f297f2ecc34d36f38899 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/layer_05-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6058f0d54d4434bd52f3b2272f7a2f592ecb3ce7810494c161f6b2211244c81 +size 113308931 diff --git a/4b284b84bc4seed3/global_step80108/layer_06-model_00-model_states.pt b/4b284b84bc4seed3/global_step80108/layer_06-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..84a87b77aba7501f92fbc4eeaa343ae63e1ee3bd --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/layer_06-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f174f51dc9471a3bdbd159e70babed190d1f6f61c6e316e5d3a82c63928a63e7 +size 113308931 diff --git a/4b284b84bc4seed3/global_step80108/layer_06-model_01-model_states.pt b/4b284b84bc4seed3/global_step80108/layer_06-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..99897228551cb563f99dd684596fd7722de13995 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/layer_06-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6ca98dfb0c8d420e3a1c85109776dad4e8a36e0cfd1b6c9c36c44afa23ce2d6 +size 113308931 diff --git a/4b284b84bc4seed3/global_step80108/layer_07-model_00-model_states.pt b/4b284b84bc4seed3/global_step80108/layer_07-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..70ecfe6feb033e613412a89a2141f11fd6e9d65e --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/layer_07-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8be3a8d347f6611f6c337a64109d4507c219875c485129db349cc08b30320d3a +size 113308931 diff --git a/4b284b84bc4seed3/global_step80108/layer_07-model_01-model_states.pt b/4b284b84bc4seed3/global_step80108/layer_07-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..27c6aa8f2cd6b6498f97544f84c4c51ff5b847ca --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/layer_07-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87ef853909a9738735cdccbd654da2ae3bccc8defae4c2bf3a329f09ac7c1f85 +size 113308931 diff --git a/4b284b84bc4seed3/global_step80108/layer_08-model_00-model_states.pt b/4b284b84bc4seed3/global_step80108/layer_08-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c1662a1501df7032a6e9dfc7dc882b6115e3359f --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/layer_08-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e50cc506f8d4e4c4bb8b94e7455d847a0f085738d828dc3a1ef7de0a10ee283 +size 113308931 diff --git a/4b284b84bc4seed3/global_step80108/layer_08-model_01-model_states.pt b/4b284b84bc4seed3/global_step80108/layer_08-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6668f563b4dfe01653065fa0f6efbff1469a2581 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/layer_08-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4fac0a4ffd80b3016af2b5e55c25868d6d9ed7fff5c628c120eff6a130053f6 +size 113308931 diff --git a/4b284b84bc4seed3/global_step80108/layer_09-model_00-model_states.pt b/4b284b84bc4seed3/global_step80108/layer_09-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3dc157b78be611095469a6d00685b44bf018c32a --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/layer_09-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfdff81a11f2ebe0a5815a1e0977aa112676bdeb9b2650d10670c3ee97977e34 +size 113308931 diff --git a/4b284b84bc4seed3/global_step80108/layer_09-model_01-model_states.pt b/4b284b84bc4seed3/global_step80108/layer_09-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d2969ce61f49e13cfc049f7f575701b14c24e694 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/layer_09-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6ec31948ff6cfd8eba72e2e3562bc590b2c9882f9c2ebcdf472ececa7b1a0df +size 113308931 diff --git a/4b284b84bc4seed3/global_step80108/layer_10-model_00-model_states.pt b/4b284b84bc4seed3/global_step80108/layer_10-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..84bd4da638e961967d6149a3e32527650fbec442 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/layer_10-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f6c63ff869c405c22bf78d1c7da4015b60b7f80904b4ec487e08548ac4b3548 +size 113308931 diff --git a/4b284b84bc4seed3/global_step80108/layer_10-model_01-model_states.pt b/4b284b84bc4seed3/global_step80108/layer_10-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..140c40d3ae126070267f5efe18f13bfa3ec1a21b --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/layer_10-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0415d118e683b770ea9796fb09dd49bb0534603c074dc5d20b6caf8736664b1e +size 113308931 diff --git a/4b284b84bc4seed3/global_step80108/layer_11-model_00-model_states.pt b/4b284b84bc4seed3/global_step80108/layer_11-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c9b55376da7b12f98cd90fc87e3c8464cbf7e960 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/layer_11-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ad97a5739f9d6756f9164c8960a666b0abca0b60ddc15f406c45ef9ac6727de +size 113308931 diff --git a/4b284b84bc4seed3/global_step80108/layer_11-model_01-model_states.pt b/4b284b84bc4seed3/global_step80108/layer_11-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ca802c8b4498cd80b1938875db15e62d4b3889d --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/layer_11-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:211a3e648d5ae68460bfea328590590f559a1eef98873b49f689d2380e9bdc5a +size 113308931 diff --git a/4b284b84bc4seed3/global_step80108/layer_12-model_00-model_states.pt b/4b284b84bc4seed3/global_step80108/layer_12-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d0fcb34ac61432df81e30fe7e3a9c359f0920f7c --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/layer_12-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07d6aaa08662189058d2688f0d06caf4183e30e8ecf22f813fe60f8bbe16566f +size 113308931 diff --git a/4b284b84bc4seed3/global_step80108/layer_12-model_01-model_states.pt b/4b284b84bc4seed3/global_step80108/layer_12-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c6a6db1fe6f54b951a7afef6501c8d4b2d32228 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/layer_12-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ea243d390513fe2b7f13a40ba621aa9c1e78c5cefdb56f8cd941dceef913c4d +size 113308931 diff --git a/4b284b84bc4seed3/global_step80108/layer_13-model_00-model_states.pt b/4b284b84bc4seed3/global_step80108/layer_13-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9403ff5d1ecbc456ebd756a2e7063f4721dc3838 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/layer_13-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e656d69dad56e50bc22cfdd87a849a05cb770490d760b09de58e6d996ba5448f +size 113308931 diff --git a/4b284b84bc4seed3/global_step80108/layer_13-model_01-model_states.pt b/4b284b84bc4seed3/global_step80108/layer_13-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f577a53fc138ef8ca3f869faf44f9eb628b0404 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/layer_13-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f009f7745221afc96c19313ccda469de7f959c92e8edfd6026a0fedb7a36d9e +size 113308931 diff --git a/4b284b84bc4seed3/global_step80108/layer_14-model_00-model_states.pt b/4b284b84bc4seed3/global_step80108/layer_14-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5fa34c07cab7b813144b845e722ddd7eb59f804c --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/layer_14-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7a58605b8aa9f7c5c7cc3fc7c701a49347ea4456ce617b5908cc4766d37aeea +size 113308931 diff --git a/4b284b84bc4seed3/global_step80108/layer_14-model_01-model_states.pt b/4b284b84bc4seed3/global_step80108/layer_14-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..444f4c5e261d8bab61cfcca3379260d7c4562a7a --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/layer_14-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fbb5d8365a5058bad1c901123b0805217c9afea1b48e5594413dba26055b5729 +size 113308931 diff --git a/4b284b84bc4seed3/global_step80108/layer_15-model_00-model_states.pt b/4b284b84bc4seed3/global_step80108/layer_15-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a284306633f268650cdeffa27263f119d7eefe5 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/layer_15-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce4d4ed210abe2336b8a4ab9b9614919d1a6f9de83db83e2de0b2c3d8b7f9505 +size 113308931 diff --git a/4b284b84bc4seed3/global_step80108/layer_15-model_01-model_states.pt b/4b284b84bc4seed3/global_step80108/layer_15-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ebdcb3bb97a9d9d20990293fb0b7ba5355c49da6 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/layer_15-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:117feb85d3508fdc25b71774cc0f699e483f4beda1a7a2f8f131ce4fd58b138c +size 113308931 diff --git a/4b284b84bc4seed3/global_step80108/layer_16-model_00-model_states.pt b/4b284b84bc4seed3/global_step80108/layer_16-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..44d85315be55c9ad3d58ab60d52a2b349bd01bab --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/layer_16-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca0ade7547507d70e1ae5126bdd22ddb8399f04d5006a3575d73a812f85c02d3 +size 113308931 diff --git a/4b284b84bc4seed3/global_step80108/layer_16-model_01-model_states.pt b/4b284b84bc4seed3/global_step80108/layer_16-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..04856a2be6ffc27cdfcf630e873d651c0246e03e --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/layer_16-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:79660d65bafd91ec9be92b4cf17aca5d793c9294c54d5a412729aaea4ed27413 +size 113308931 diff --git a/4b284b84bc4seed3/global_step80108/layer_17-model_00-model_states.pt b/4b284b84bc4seed3/global_step80108/layer_17-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6983849940c215a1cf319c5d6da9f4d8e14e97a7 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/layer_17-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:533ee472c71f9728dd0982cb359ba5b50feec1603d2766d532b6e49b60bd0bd8 +size 113308931 diff --git a/4b284b84bc4seed3/global_step80108/layer_17-model_01-model_states.pt b/4b284b84bc4seed3/global_step80108/layer_17-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c5c450b01b5226e304aa2dd02e334906f1631a49 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/layer_17-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:efa44be025fd298cf3ae1f5befd53fd2e39a10b2df5319d002fd0f9d5f39dd23 +size 113308931 diff --git a/4b284b84bc4seed3/global_step80108/layer_18-model_00-model_states.pt b/4b284b84bc4seed3/global_step80108/layer_18-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee0354f0f19b6ccf45254f65dec6f9a613770861 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/layer_18-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60c3fef123980b93ce7fd973d36c47204eac471140e278dbb49c8d3e5071770f +size 113308931 diff --git a/4b284b84bc4seed3/global_step80108/layer_18-model_01-model_states.pt b/4b284b84bc4seed3/global_step80108/layer_18-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5bd06189578d7b946c847c876c83033216c2b56e --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/layer_18-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef276c3ee32df150f48bb1d2356d5d5780268dc23b6b281779d01e0eadd18b44 +size 113308931 diff --git a/4b284b84bc4seed3/global_step80108/layer_19-model_00-model_states.pt b/4b284b84bc4seed3/global_step80108/layer_19-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c1a1045ac6d8f1eeb8005ca9b3c540a6077ccf8 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/layer_19-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09ed0e87ce8577ebd289935ca3c29cf2208cb8f9e7d00c210635631968885546 +size 113308931 diff --git a/4b284b84bc4seed3/global_step80108/layer_19-model_01-model_states.pt b/4b284b84bc4seed3/global_step80108/layer_19-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6fa9b7667da9f848a562086341045c1d9315d296 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/layer_19-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e4c43821a2960f844a6262db9654dd47068cb7040174380804a5779b5c4e5b5 +size 113308931 diff --git a/4b284b84bc4seed3/global_step80108/layer_20-model_00-model_states.pt b/4b284b84bc4seed3/global_step80108/layer_20-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..495e15d0154756c859c91a33262e927a746a6ff8 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/layer_20-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:531b110b83f98c314aad95f924dc0ab54fe63f4509dd2327c6624041f0d8193b +size 113308931 diff --git a/4b284b84bc4seed3/global_step80108/layer_20-model_01-model_states.pt b/4b284b84bc4seed3/global_step80108/layer_20-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d7df636a7837c9c6efbde600eb1cc8d20944965 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/layer_20-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8cfeb17a3489d72fc6498c970de4b7422acddcc8e0168687465e31d3b09ead4c +size 113308931 diff --git a/4b284b84bc4seed3/global_step80108/layer_21-model_00-model_states.pt b/4b284b84bc4seed3/global_step80108/layer_21-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8aa6ce423c110f520d4d341f870bd472a30ffb61 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/layer_21-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33807868e6ca84162b380d02a67669790dc78e8e5f9a60d0b7d75db23dadccc0 +size 113308931 diff --git a/4b284b84bc4seed3/global_step80108/layer_21-model_01-model_states.pt b/4b284b84bc4seed3/global_step80108/layer_21-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..546d85b03644f822b0c96657962482cd1712f2b5 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/layer_21-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b316e975f3d1ce445fa376a4816fb014ad8bb2cdccc713621952da971d2b279b +size 113308931 diff --git a/4b284b84bc4seed3/global_step80108/layer_22-model_00-model_states.pt b/4b284b84bc4seed3/global_step80108/layer_22-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fafe43dd35ba7ea2d5dbae9de0c0cb35020aa335 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/layer_22-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:431bd5cde044702562957532f929eba2e240a3c6a3a0a565761670cf79372101 +size 113308931 diff --git a/4b284b84bc4seed3/global_step80108/layer_22-model_01-model_states.pt b/4b284b84bc4seed3/global_step80108/layer_22-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c8b082c945a0a8630c3ccc1a15f9da0eba523443 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/layer_22-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70281a92281f319a4fe3e536392486143b9878600207fd3212ff9224e9790188 +size 113308931 diff --git a/4b284b84bc4seed3/global_step80108/layer_23-model_00-model_states.pt b/4b284b84bc4seed3/global_step80108/layer_23-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5edfd22a2cd1751473d1a60ef2e4d7b497d0fc02 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/layer_23-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:033c4336abe6d0e62c01340bbd95bb67feee0ee500b585e7266dcb987cfafe90 +size 113308931 diff --git a/4b284b84bc4seed3/global_step80108/layer_23-model_01-model_states.pt b/4b284b84bc4seed3/global_step80108/layer_23-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ddcf14978972ff19c27bffe2efc6c2fccdfcbc84 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/layer_23-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:506b72f8ffcf6fc42d945e2c23124baabfc561de5c90c5d0bf51765440845f50 +size 113308931 diff --git a/4b284b84bc4seed3/global_step80108/layer_24-model_00-model_states.pt b/4b284b84bc4seed3/global_step80108/layer_24-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d053cf49571b591313968bbf3eaedcb3cce64e6b --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/layer_24-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f766646bd5a9b80dfe7e9a03c931c93667982d078a0f42ae74c0f97ddb59cf6c +size 113308931 diff --git a/4b284b84bc4seed3/global_step80108/layer_24-model_01-model_states.pt b/4b284b84bc4seed3/global_step80108/layer_24-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e4be04adacdbe7b15b9033ffd05c49ed82727ac0 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/layer_24-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70317dd1b65d7e24be7b1bdd280d0c6419fec2db6daae55ed03f16da7bed80b7 +size 113308931 diff --git a/4b284b84bc4seed3/global_step80108/layer_25-model_00-model_states.pt b/4b284b84bc4seed3/global_step80108/layer_25-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f0af64a8f4dd3c15c5ea6adf27951934ff12ddb4 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/layer_25-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4504fd4ff87a22e173624d2aa90c3c69768f6ccce576354d2f1e315d2d546ba7 +size 113308931 diff --git a/4b284b84bc4seed3/global_step80108/layer_25-model_01-model_states.pt b/4b284b84bc4seed3/global_step80108/layer_25-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..36f4dbab36e205b7aa567886f95c6203c4daf650 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/layer_25-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54671647ab5d9d75fe2c3bcdcd29e0fcae3759bfb96bbef8b5f08e61a9bf8bd1 +size 113308931 diff --git a/4b284b84bc4seed3/global_step80108/layer_26-model_00-model_states.pt b/4b284b84bc4seed3/global_step80108/layer_26-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8d8d4814f88c82ed8ffa4b5ed15dd1f3c7c6a9d2 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/layer_26-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d14d85ed85ff8b4492e8d6a141f3d9dafd63d85c88d98e7bb9687bb698fe38dc +size 113308931 diff --git a/4b284b84bc4seed3/global_step80108/layer_26-model_01-model_states.pt b/4b284b84bc4seed3/global_step80108/layer_26-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..84276c23db01402f18fd6164874052dead7eb0c6 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/layer_26-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:639b5d73d312c683eab4bcf15127574ffd0780408f5e3621dc939fc01f872f26 +size 113308931 diff --git a/4b284b84bc4seed3/global_step80108/layer_27-model_00-model_states.pt b/4b284b84bc4seed3/global_step80108/layer_27-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..32925fb1b8ce1f8968f66e409a7bee0bbeaf408b --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/layer_27-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d55eca5f652cc2a03267fa6033796d5a31f27555c7feee9dccc2280730ebe44f +size 113308931 diff --git a/4b284b84bc4seed3/global_step80108/layer_27-model_01-model_states.pt b/4b284b84bc4seed3/global_step80108/layer_27-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..522279f5a1e1e9292b0f46f7fa75ae519673564f --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/layer_27-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e0aeb10248c618491fc66b3460422b32a997dde4d2f923714f41eff2438867d +size 113308931 diff --git a/4b284b84bc4seed3/global_step80108/layer_28-model_00-model_states.pt b/4b284b84bc4seed3/global_step80108/layer_28-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..81b024945c790b418ccced137c73fb64834d2436 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/layer_28-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51cbaeccffadd80d7e391ff89d19bb86d9aa5c0cb47c4b8fd90ecc1b3e8241a7 +size 113308931 diff --git a/4b284b84bc4seed3/global_step80108/layer_28-model_01-model_states.pt b/4b284b84bc4seed3/global_step80108/layer_28-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..265f3b749f1cdc5f5318fbc6f95bcb1de203777a --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/layer_28-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:180e42b9000596314be2f636b7f0efb04c4af386e7894d282d24a42082f28a2d +size 113308931 diff --git a/4b284b84bc4seed3/global_step80108/layer_29-model_00-model_states.pt b/4b284b84bc4seed3/global_step80108/layer_29-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a18da2285e977b3131ce8691610f65d0e905050 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/layer_29-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed96b837da5596650fc9ddb1d1257587ee033ec083f48044a36e5c6827f63286 +size 113308931 diff --git a/4b284b84bc4seed3/global_step80108/layer_29-model_01-model_states.pt b/4b284b84bc4seed3/global_step80108/layer_29-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e8bcedf4597818463a924cd5cb1bf87a332375b1 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/layer_29-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73e4761830e2c29596700aede825c4c6a6ec35f5623da6295284fcf7be6b0c9b +size 113308931 diff --git a/4b284b84bc4seed3/global_step80108/layer_30-model_00-model_states.pt b/4b284b84bc4seed3/global_step80108/layer_30-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b0377f79bfb1c5717c27c4e1503887095bbd81f9 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/layer_30-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b12747a3d31f7aadbda1798d6cee362a44982ee215d1bfe3f37c8f949e598ea +size 113308931 diff --git a/4b284b84bc4seed3/global_step80108/layer_30-model_01-model_states.pt b/4b284b84bc4seed3/global_step80108/layer_30-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..abe1ffc0cf3dd878b3516343466cad93477d3dab --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/layer_30-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28ccc0f31e8f398b0798744c1cbe9828154ba7fb1f7a46c1af94de8fc68fb5fa +size 113308931 diff --git a/4b284b84bc4seed3/global_step80108/layer_31-model_00-model_states.pt b/4b284b84bc4seed3/global_step80108/layer_31-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b48671c8e9ddad9d445699634601f5b95d6c65f1 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/layer_31-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eecb83c06c8d229a6837b7031217100ccf2e820b7e8c1748b870353cf2198829 +size 113308931 diff --git a/4b284b84bc4seed3/global_step80108/layer_31-model_01-model_states.pt b/4b284b84bc4seed3/global_step80108/layer_31-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..930f527e9ae44cd7303b84b71b5ea39de872f36a --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/layer_31-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ae594a1bb74e96751da4b1d183c314ac33e811d5f20da001135a66b52e65f90 +size 113308931 diff --git a/4b284b84bc4seed3/global_step80108/layer_32-model_00-model_states.pt b/4b284b84bc4seed3/global_step80108/layer_32-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..518a8e88ffee5827a8da105b1ac902e91b2853f4 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/layer_32-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a04c229ff1bcbd47dd9eb93a8cb37232aadd7dab130865d0dd46b41dd4a7412 +size 113308931 diff --git a/4b284b84bc4seed3/global_step80108/layer_32-model_01-model_states.pt b/4b284b84bc4seed3/global_step80108/layer_32-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..14ba722ca79da4fa1abb7f2c8775ae1ad67a483a --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/layer_32-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa8790f661d3fe30c78674672c9b1cf851fceffa363001563a9e34336bb33f18 +size 113308931 diff --git a/4b284b84bc4seed3/global_step80108/layer_33-model_00-model_states.pt b/4b284b84bc4seed3/global_step80108/layer_33-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..36506c8cca8be82b15cae166d281a85da5b3f693 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/layer_33-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4476f58491a581645c116b5622d210392694ed3624346106c0030d5b7beafdb5 +size 113308931 diff --git a/4b284b84bc4seed3/global_step80108/layer_33-model_01-model_states.pt b/4b284b84bc4seed3/global_step80108/layer_33-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab14cd4cec1807544aa1b3179b7ffa51bfe65fad --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/layer_33-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0bd8a772bc9d5c8cd226fb89ef6bcf7c66a45b760d8df8709d4cfd8e4f549a98 +size 113308931 diff --git a/4b284b84bc4seed3/global_step80108/layer_34-model_00-model_states.pt b/4b284b84bc4seed3/global_step80108/layer_34-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf22de58efbadf834f2e90c7cdae71462353f062 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/layer_34-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b1d9018fde5542dde4cc6700f90b0dba6ef93a0ec9426f2a2036de809bebb3f +size 113308931 diff --git a/4b284b84bc4seed3/global_step80108/layer_34-model_01-model_states.pt b/4b284b84bc4seed3/global_step80108/layer_34-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ea4fc41cfe621125b36c260c136a8848f92b0f3 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/layer_34-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9d845aad477201411962aade9a3a6889a6d80024d42b26cb34913f1cc600344 +size 113308931 diff --git a/4b284b84bc4seed3/global_step80108/layer_35-model_00-model_states.pt b/4b284b84bc4seed3/global_step80108/layer_35-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..08e967e95974d242b83a6dbbd45e65be61bbee33 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/layer_35-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b55c5fccad58d2faba023312e990a62225460870cb9046f5f2a86e61c5e2e6ec +size 113308931 diff --git a/4b284b84bc4seed3/global_step80108/layer_35-model_01-model_states.pt b/4b284b84bc4seed3/global_step80108/layer_35-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2680ea15e35c923b67ad0a8dde5c4b3c7d553402 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/layer_35-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4cd5c57c2cb3137ba73a48c3b10a0ff1a8233a6b4ef157c669a79862af804ab4 +size 113308931 diff --git a/4b284b84bc4seed3/global_step80108/layer_36-model_00-model_states.pt b/4b284b84bc4seed3/global_step80108/layer_36-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d43e859e65d81ffd0b73f69959e33a99c01767a9 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/layer_36-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fbf8dd68e67a309b8e1bd269fcdde4e73e21ecf9fb205b95239477661f4f3d3f +size 113308931 diff --git a/4b284b84bc4seed3/global_step80108/layer_36-model_01-model_states.pt b/4b284b84bc4seed3/global_step80108/layer_36-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e86f8601983c81c6d2aab6c1d6d912fbaa152d0 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/layer_36-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8be1d43b1cd8329d6cb57c8ea8da7255d419f5b9b05c0ceb7798eb11dce54616 +size 113308931 diff --git a/4b284b84bc4seed3/global_step80108/layer_37-model_00-model_states.pt b/4b284b84bc4seed3/global_step80108/layer_37-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..be5ad6f00dce013ea1d6cd19a107df8428d30721 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/layer_37-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30592896fd1079197b47a9601ae8e81f8ee72ee7d952e8cecd1c3cfa9cc56244 +size 113308931 diff --git a/4b284b84bc4seed3/global_step80108/layer_37-model_01-model_states.pt b/4b284b84bc4seed3/global_step80108/layer_37-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc5a8d0953629d29e2252f59ddee630d020a2b87 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/layer_37-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e21928332ab73e14a1bc8f7cb0dba59dbe56e730399e7f5c88d3acee1e724a9 +size 113308931 diff --git a/4b284b84bc4seed3/global_step80108/layer_38-model_00-model_states.pt b/4b284b84bc4seed3/global_step80108/layer_38-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8d6a6c10a61a34ced00e5eac41cd9eba6d485b0e --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/layer_38-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:654ff1f3278e53785ef37e41767b126f79a23c4267aec47d3515fa3ea9aef2f8 +size 113308931 diff --git a/4b284b84bc4seed3/global_step80108/layer_38-model_01-model_states.pt b/4b284b84bc4seed3/global_step80108/layer_38-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d9ea9f279a5e6c2b03c5dcbb6affdfe3665b6ac3 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/layer_38-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2281046dcb6cc5577e51b6a5e6ead9f53ce3c38d4a974dffaf73df6fca83a666 +size 113308931 diff --git a/4b284b84bc4seed3/global_step80108/layer_40-model_00-model_states.pt b/4b284b84bc4seed3/global_step80108/layer_40-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d5074d0cf7244023076aef61d5c8a4f24e791286 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/layer_40-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48d4bfe3cd13e0ede460a92391b0edb5f73c7dfc30dc806bb832b83c0f648d38 +size 13507 diff --git a/4b284b84bc4seed3/global_step80108/layer_40-model_01-model_states.pt b/4b284b84bc4seed3/global_step80108/layer_40-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..70b88d9574aeea125b844a96c0333cf03e451a8e --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/layer_40-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aae175a0a587748bd99d8846830c54fb954206131d24aecfcdd38e0ee2eb4666 +size 13507 diff --git a/4b284b84bc4seed3/global_step80108/mp_rank_00_model_states.pt b/4b284b84bc4seed3/global_step80108/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a354fd0de598c9363a2deaf3d5fea24e4dbafe68 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:804719a34e65da3e1b9f209d55c68adaf83e1feebe6be6a0e371a9369dfbbc4c +size 51443 diff --git a/4b284b84bc4seed3/global_step80108/mp_rank_01_model_states.pt b/4b284b84bc4seed3/global_step80108/mp_rank_01_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..99246453a420168ec87e02fc003517d8ca295ff1 --- /dev/null +++ b/4b284b84bc4seed3/global_step80108/mp_rank_01_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa93cae611887d0ed55094d344e8a38c19a9c381231cc5362481ff692136e0ba +size 51443 diff --git a/4b284b84bc4seed3/transformers/config.json b/4b284b84bc4seed3/transformers/config.json new file mode 100644 index 0000000000000000000000000000000000000000..df814c3a71ee49044410636b5eeb4f43611690ba --- /dev/null +++ b/4b284b84bc4seed3/transformers/config.json @@ -0,0 +1 @@ +{"vocab_size": 50432, "n_positions": 2048, "n_embd": 3072, "n_layer": 36, "n_head": 24, "n_inner": 12288, "activation_function": "gelu", "resid_pdrop": 0.1, "embd_pdrop": 0.1, "attn_pdrop": 0.1, "layer_norm_epsilon": 1e-05, "initializer_range": 0.02, "summary_type": "cls_index", "summary_use_proj": true, "summary_activation": null, "summary_first_dropout": 0.1, "summary_proj_to_labels": true, "scale_attn_weights": true, "use_cache": true, "scale_attn_by_inverse_layer_idx": false, "reorder_and_upcast_attn": false, "bos_token_id": 50256, "eos_token_id": 50256, "return_dict": true, "output_hidden_states": false, "output_attentions": false, "torchscript": false, "torch_dtype": null, "use_bfloat16": false, "tf_legacy_loss": false, "pruned_heads": {}, "tie_word_embeddings": true, "is_encoder_decoder": false, "is_decoder": false, "cross_attention_hidden_size": null, "add_cross_attention": false, "tie_encoder_decoder": false, "max_length": 20, "min_length": 0, "do_sample": false, "early_stopping": false, "num_beams": 1, "num_beam_groups": 1, "diversity_penalty": 0.0, "temperature": 1.0, "top_k": 50, "top_p": 1.0, "typical_p": 1.0, "repetition_penalty": 1.0, "length_penalty": 1.0, "no_repeat_ngram_size": 0, "encoder_no_repeat_ngram_size": 0, "bad_words_ids": null, "num_return_sequences": 1, "chunk_size_feed_forward": 0, "output_scores": false, "return_dict_in_generate": false, "forced_bos_token_id": null, "forced_eos_token_id": null, "remove_invalid_values": false, "exponential_decay_length_penalty": null, "suppress_tokens": null, "begin_suppress_tokens": null, "architectures": ["GPT2LMHeadModel"], "finetuning_task": null, "id2label": {"0": "LABEL_0", "1": "LABEL_1"}, "label2id": {"LABEL_0": 0, "LABEL_1": 1}, "tokenizer_class": null, "prefix": null, "pad_token_id": null, "sep_token_id": null, "decoder_start_token_id": null, "task_specific_params": null, "problem_type": null, "_name_or_path": "", "transformers_version": "4.25.0.dev0", "n_ctx": 1024, "gradient_checkpointing": false, "model_type": "gpt2"} \ No newline at end of file diff --git a/4b284b84bc4seed3/transformers/pytorch_model.bin b/4b284b84bc4seed3/transformers/pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..58c1c84eb2c6d3778af7fac2573cdf7ca79c8fd9 --- /dev/null +++ b/4b284b84bc4seed3/transformers/pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e49ca0a72a71900e37572fe0163e3e080c20bc3218bf4218e1072f0631f4b014 +size 8781203669 diff --git a/4b284b84bc4seed4/evaluation/generation/agg.4b284b84bc4seed4_GEM-web_nlg_en_PALM_prompt_0.json b/4b284b84bc4seed4/evaluation/generation/agg.4b284b84bc4seed4_GEM-web_nlg_en_PALM_prompt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..4390f90bb94e961543ccad360bd3c5b7c11dfc1f --- /dev/null +++ b/4b284b84bc4seed4/evaluation/generation/agg.4b284b84bc4seed4_GEM-web_nlg_en_PALM_prompt_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.3523277002277804, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.03261401734869028}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07140357303785742, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0017735064753741127}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.2938068811232804, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004698591443703581}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.10590846249521367, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0020195315762052673}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.033440949253294806, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.001066168691596413}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.14239106266330545, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003163086494032039}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.050108480283474685, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0012479824947943812}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.06888442229810386, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001675844279268184}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.2866580974880424, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004577594263202556}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.10246592063839631, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0018904079137483055}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.06827936311686421, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.001698555616698455}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.28107278592336027, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004438130822299941}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.10120297741035127, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0018969772318448463}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed4/evaluation/generation/agg.4b284b84bc4seed4_GEM-web_nlg_en_PALM_prompt_1.json b/4b284b84bc4seed4/evaluation/generation/agg.4b284b84bc4seed4_GEM-web_nlg_en_PALM_prompt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..ac87fa7a1a7083c954600f2b90d7df01224b10c4 --- /dev/null +++ b/4b284b84bc4seed4/evaluation/generation/agg.4b284b84bc4seed4_GEM-web_nlg_en_PALM_prompt_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.4351779771917347, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.03461044967042056}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07162194662437592, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0013087409774892172}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.3606308247426329, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005204874863706004}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.11195633719029822, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0017956976300324953}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03355406237669093, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0008232466042918183}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.17649806895632947, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003573445474921975}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.05255280813689339, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0011567693373819863}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.06810242914702684, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0012110333378022905}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.34048847512021524, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004750749477340653}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.10647953810824176, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0016760663905838954}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.06848895184352013, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0012480162482644015}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.3429613098536967, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004820988766109633}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.10693711806502432, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0017046988764721166}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed4/evaluation/generation/agg.4b284b84bc4seed4_GEM-web_nlg_en_PALM_prompt_2.json b/4b284b84bc4seed4/evaluation/generation/agg.4b284b84bc4seed4_GEM-web_nlg_en_PALM_prompt_2.json new file mode 100644 index 0000000000000000000000000000000000000000..62134eed8a3c1dfbd9a0f9b76109321220a8db8e --- /dev/null +++ b/4b284b84bc4seed4/evaluation/generation/agg.4b284b84bc4seed4_GEM-web_nlg_en_PALM_prompt_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.4447149214180348, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.018972548555560714}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07269992209256788, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0012516992696440586}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.3753121304840736, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0050439493858917194}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.11462405866857102, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.001736014539262953}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03404844764438817, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007680445086395626}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.1879602254006144, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003710463717182471}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.05396475791939589, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001107305452781615}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.06834435101252613, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0011410779513936623}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.350761541750936, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0045336528849166365}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.10775063055928252, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0015887580065971389}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.06935895852997251, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0011852302620070257}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.3565184552784119, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004687409183137695}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.10926127364577738, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016390081021653892}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed4/evaluation/generation/agg.4b284b84bc4seed4_GEM-web_nlg_en_PALM_prompt_3.json b/4b284b84bc4seed4/evaluation/generation/agg.4b284b84bc4seed4_GEM-web_nlg_en_PALM_prompt_3.json new file mode 100644 index 0000000000000000000000000000000000000000..1bf0c6fe637e42c6f81f269459e83485b53d014f --- /dev/null +++ b/4b284b84bc4seed4/evaluation/generation/agg.4b284b84bc4seed4_GEM-web_nlg_en_PALM_prompt_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.5087674664658492, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.026893638286752154}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.072497531691811, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0012026919993320111}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.38474435436270493, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005142183312772921}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.11467972816113098, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.001673200203783686}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03380876275906201, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007518942865145289}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.19155642039509754, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0037517387263905507}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.05374249345557979, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0010894570854945713}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.06774922502819766, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0011043288246760676}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.355788174091109, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004543365107062434}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.10704454572486424, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0015340338132748832}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.06899862406820627, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0011409968694109725}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.36454854774413287, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004741615558398587}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.10908169881982438, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0015837111282973452}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed4/evaluation/generation/agg.4b284b84bc4seed4_GEM-web_nlg_en_PALM_prompt_4.json b/4b284b84bc4seed4/evaluation/generation/agg.4b284b84bc4seed4_GEM-web_nlg_en_PALM_prompt_4.json new file mode 100644 index 0000000000000000000000000000000000000000..974b93681eb6e0047e1fd451f5b24318342e2ad2 --- /dev/null +++ b/4b284b84bc4seed4/evaluation/generation/agg.4b284b84bc4seed4_GEM-web_nlg_en_PALM_prompt_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.5913746773860721, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.041085758656651254}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07471728852529957, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.00120444126407064}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.4024992804481891, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005245342121017829}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.11862510680315241, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0016779930474832658}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.0348700360833608, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007408153164874413}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.2036124062513765, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.00387597600568855}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.05567978816710457, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0010718834740964826}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.06888490676353087, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0010959048971556757}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.3672784960986926, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004566861844635672}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.10913463867270404, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0015113181951666658}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.07096869733176525, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0011452901218571788}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.3804621853389486, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.00482918129805665}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.11255292648692071, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0015868430386374208}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed4/evaluation/generation/agg.4b284b84bc4seed4_GEM-web_nlg_en_PALM_prompt_5.json b/4b284b84bc4seed4/evaluation/generation/agg.4b284b84bc4seed4_GEM-web_nlg_en_PALM_prompt_5.json new file mode 100644 index 0000000000000000000000000000000000000000..af28d8b16f4203d9b37f5f21f3a57adc431a28d0 --- /dev/null +++ b/4b284b84bc4seed4/evaluation/generation/agg.4b284b84bc4seed4_GEM-web_nlg_en_PALM_prompt_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.6304604966593631, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.03484982021747957}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.0744328271529154, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.001157549734274375}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.4127612356762462, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0052523273943021025}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.11884850755997649, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.001616705319256009}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03482016206562085, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007258016003322981}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.20894584695108945, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0038600278798887723}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.05592752125205284, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0010528579472296477}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.0684803394428656, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0010698339353882353}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.3750129978505135, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004543607982881679}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.1090677963632186, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0014765997700889857}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.07077155348314326, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0011076088583072189}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.3900673103247878, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0048425468419916184}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.11288876880831, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0015402308170382386}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed4/evaluation/generation/agg.4b284b84bc4seed4_GEM-wiki_lingua_en_tldr_en_0.json b/4b284b84bc4seed4/evaluation/generation/agg.4b284b84bc4seed4_GEM-wiki_lingua_en_tldr_en_0.json new file mode 100644 index 0000000000000000000000000000000000000000..91a56b35aa1a5514644cdb491406568cd4c3345e --- /dev/null +++ b/4b284b84bc4seed4/evaluation/generation/agg.4b284b84bc4seed4_GEM-wiki_lingua_en_tldr_en_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.15130222816102726, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0018641353605878376}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.2585048040019072, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0026633037296359954}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.17708913864416292, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0018212193534322709}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.030354095195740356, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007454497776331851}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.05433811946884532, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0014397669916064314}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.0358183863771304, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.00084133860800268}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.11775252929311998, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0013049047450472628}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.20864111880992672, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002169509233782621}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.1395967400507796, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001313393024815337}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.13805300047109062, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0017010449743815584}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.23676218222386985, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002462862595699301}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.16174636673799278, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016649134344973989}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 1.5421125542141876, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.05756547176107712}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed4/evaluation/generation/agg.4b284b84bc4seed4_GEM-wiki_lingua_en_tldr_en_1.json b/4b284b84bc4seed4/evaluation/generation/agg.4b284b84bc4seed4_GEM-wiki_lingua_en_tldr_en_1.json new file mode 100644 index 0000000000000000000000000000000000000000..3d0f3dd4b62133f5456a8543b6f1d07ba81387c6 --- /dev/null +++ b/4b284b84bc4seed4/evaluation/generation/agg.4b284b84bc4seed4_GEM-wiki_lingua_en_tldr_en_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.2194647051475106, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0026637127905829957}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.32953538987527364, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0029752735913270213}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.23390150161377168, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0020117545140889465}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.060079962682567656, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0015430426704356244}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.08864081298208347, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0018541652458318118}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.061675743964392724, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0011660228294911223}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.1539694016100103, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0020721550784059055}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.23350379059815546, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002302352375151091}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.1623726890739185, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0013550604960878186}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.20602533584010463, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.00254117072503622}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.30941435638814363, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0028218530563501962}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.21928618412182982, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0018889547156816118}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 3.1118566247604162, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.062088508469292286}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed4/evaluation/generation/agg.4b284b84bc4seed4_GEM-wiki_lingua_en_tldr_en_2.json b/4b284b84bc4seed4/evaluation/generation/agg.4b284b84bc4seed4_GEM-wiki_lingua_en_tldr_en_2.json new file mode 100644 index 0000000000000000000000000000000000000000..f46109f0bbdb00d9643afcec92ac65462d69e0c0 --- /dev/null +++ b/4b284b84bc4seed4/evaluation/generation/agg.4b284b84bc4seed4_GEM-wiki_lingua_en_tldr_en_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.21230058363878315, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0024080619207750963}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.34134579643295393, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.00287291808958866}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.23819401638529333, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.001961472755718473}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.058180340769663996, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0012366998672630046}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.09448704160727436, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0018410055564769775}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.06423744493296574, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0011237343652403928}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.14716839436847945, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001723324637255188}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.24371061167078392, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002305940409051167}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.16572553377575022, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0013269375688079502}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.19985650365773666, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0022791002962553927}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.32205265894357177, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0027492000000614377}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.22428067952847994, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.001853122562183745}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 3.3250803512114917, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.043720151005010505}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed4/evaluation/generation/agg.4b284b84bc4seed4_GEM-wiki_lingua_en_tldr_en_3.json b/4b284b84bc4seed4/evaluation/generation/agg.4b284b84bc4seed4_GEM-wiki_lingua_en_tldr_en_3.json new file mode 100644 index 0000000000000000000000000000000000000000..d5fd2edb6d85f298ad5574e3fb1abb59c7c12dec --- /dev/null +++ b/4b284b84bc4seed4/evaluation/generation/agg.4b284b84bc4seed4_GEM-wiki_lingua_en_tldr_en_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.1759676944241637, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002599503777933057}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.2783528249629676, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.003439775464191638}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.19371662716809854, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002332163732000944}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.04672040323211839, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0011635414202250617}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.07600165390612795, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0018062659171568973}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.05098365238098847, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0010739239370527816}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.12481870305727255, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0018681974052869646}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.2032107116074926, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0026995788494260085}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.13757683764937148, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0016125055112952101}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.165693431417505, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0024409611879563638}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.26318808414968303, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0032807386039732994}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.18265210486261796, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002199082319355358}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 3.264795684563816, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.0665539830427249}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed4/evaluation/generation/agg.4b284b84bc4seed4_GEM-wiki_lingua_en_tldr_en_4.json b/4b284b84bc4seed4/evaluation/generation/agg.4b284b84bc4seed4_GEM-wiki_lingua_en_tldr_en_4.json new file mode 100644 index 0000000000000000000000000000000000000000..5ed458b1c1d4efbdf10f2aab1d032cf39bb38c0a --- /dev/null +++ b/4b284b84bc4seed4/evaluation/generation/agg.4b284b84bc4seed4_GEM-wiki_lingua_en_tldr_en_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.05753559661305722, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002138715660683914}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.0930047418871661, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0031434712495670048}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.061810069279221835, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002050884974045622}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.014474681217716064, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0008323203723133832}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.025504176001051017, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.001303289046442984}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.01571321711438463, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.000725772297710108}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.042660119298722994, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0016477900120572672}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.06969950422653938, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0024116366945608377}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.04536102247912932, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001487864376367666}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.05421281196909096, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.002025499714973123}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.08758632873317065, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0029650946931968555}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.058117132916654005, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0019249371066501861}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 0.7399731218010301, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.05315913015718361}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed4/evaluation/generation/agg.4b284b84bc4seed4_GEM-wiki_lingua_en_tldr_en_5.json b/4b284b84bc4seed4/evaluation/generation/agg.4b284b84bc4seed4_GEM-wiki_lingua_en_tldr_en_5.json new file mode 100644 index 0000000000000000000000000000000000000000..010d19ee8d9b92f604314aa1d931dd34c819fdfb --- /dev/null +++ b/4b284b84bc4seed4/evaluation/generation/agg.4b284b84bc4seed4_GEM-wiki_lingua_en_tldr_en_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.009165990245767591, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0009442979407312777}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.015418596799201417, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0015077442548408681}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.009774296059399336, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0009080621408899851}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.0023451269499108907, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.00034470873041317335}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.0046018834347627035, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0006803082985888496}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.002509211412713389, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0003022299477574736}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.00678359535997039, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0007097335601922828}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.011572236419649438, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0011572136947999466}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.00720761001914484, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0006681163091531024}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.008486993163393306, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0008690259306885085}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.014459769727609291, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0014158078041286931}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.00912075895864339, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0008473674103987658}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 1.7124193494262821e-06, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 3.2741945230754847e-06}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed4/evaluation/generation/agg.4b284b84bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_0.json b/4b284b84bc4seed4/evaluation/generation/agg.4b284b84bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..89e8383408ece1e3d2a749ad72589898364fe260 --- /dev/null +++ b/4b284b84bc4seed4/evaluation/generation/agg.4b284b84bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 0.05808891716691411, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.011333330592580656}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.3023091414929599, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002913887406749905}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.12238985523242189, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0013610627775538216}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.13899147577262666, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0009286294871679315}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.022775128205128368, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0011384359586054489}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.00610855031631702, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0002896485948013325}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.007854709999230764, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.00036516539565493495}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.2745392561803429, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002727571611712019}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.11483479288312695, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0013803318617414532}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.1275827225198627, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0008841123038167355}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.27555523169576246, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.002926670520914391}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.1020509279394632, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0009751330314082834}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.12203235569838602, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0009202893055765295}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed4/evaluation/generation/agg.4b284b84bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_1.json b/4b284b84bc4seed4/evaluation/generation/agg.4b284b84bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_1.json new file mode 100644 index 0000000000000000000000000000000000000000..f17d40f7546300aa93d78da4703b7824e3fef5ba --- /dev/null +++ b/4b284b84bc4seed4/evaluation/generation/agg.4b284b84bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 8.932841105621064, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.11441707444147597}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.44530595662757727, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0036595275413873183}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.42827303768403047, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0030343030656821836}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.3974228957995462, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002320429553502724}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.20230936163095836, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0025036401909577727}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.19120188941717492, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.00210380636425424}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.17753845874321364, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0018327497034708936}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.33275929259548276, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.00295993230865274}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.32342830006561096, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002557175371249573}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.2971909218049089, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0018836069812237484}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.36536808388203507, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0033140674546694128}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.35017983210590575, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0027753545840717682}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.3253556432256207, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0022142373615418754}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed4/evaluation/generation/agg.4b284b84bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_2.json b/4b284b84bc4seed4/evaluation/generation/agg.4b284b84bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_2.json new file mode 100644 index 0000000000000000000000000000000000000000..d25bcbe77c5efc58f1c08215009d30f7bc49e85e --- /dev/null +++ b/4b284b84bc4seed4/evaluation/generation/agg.4b284b84bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 11.880063105811095, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.17984450139554475}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.506737464401302, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0035936965647612898}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.45038732838216006, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0028591739786909026}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.44505676798399185, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0022811968446148742}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.24833021143506717, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.002726123256626373}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.2167301855181476, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002197696079985957}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.21441790403427352, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0019873610836182685}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.37992704007005046, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0030781300319706554}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.337552347296149, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0024789904236623512}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.33281096535989263, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.002027510114174692}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.4242330670183315, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0033488862052480383}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3763581811094256, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002695938632190225}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.3722406759710508, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002269175188375031}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed4/evaluation/generation/agg.4b284b84bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_3.json b/4b284b84bc4seed4/evaluation/generation/agg.4b284b84bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_3.json new file mode 100644 index 0000000000000000000000000000000000000000..90aa0b6863ca5c09bc5d54e9184e95f950433a45 --- /dev/null +++ b/4b284b84bc4seed4/evaluation/generation/agg.4b284b84bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 12.520921591661882, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.2718380639604944}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.5070856834398472, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.003526888789046483}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.45723976171215824, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0027704797956913073}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.4521518805319402, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0022515279038786227}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.255120829295647, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0027246646455271546}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.2268268997863891, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002237190631242654}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.2242096802521301, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.002021997464706373}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.3810377463717816, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.00307213165006003}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3423151690624315, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002416743374863738}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.3385818879988679, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.002056019295521777}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.4285263610786833, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003304605518552052}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.38610636284479233, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002654435476507776}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.38189174321776803, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002258684314720834}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed4/evaluation/generation/agg.4b284b84bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_4.json b/4b284b84bc4seed4/evaluation/generation/agg.4b284b84bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_4.json new file mode 100644 index 0000000000000000000000000000000000000000..4753b06ae17da99836fa399353822f4e1060629e --- /dev/null +++ b/4b284b84bc4seed4/evaluation/generation/agg.4b284b84bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 12.831367617602877, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.18248133751970383}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.5008213879398539, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.003448214786347665}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4677552019051495, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0027487310914847602}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.45672550688868757, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002254562843922049}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.252653067142654, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0026728213400761492}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.23421861425493357, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0022616561003861407}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.22808412145632054, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0020391687587871005}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.3751971515131376, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002976831493826089}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.35072100299356046, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0024722233464228543}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.34183112110248615, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.002088453787987109}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.42516588170775854, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.00322080090809883}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.39902571740048054, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002736668954410199}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.3886135908143339, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0022942589711889686}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed4/evaluation/generation/agg.4b284b84bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_5.json b/4b284b84bc4seed4/evaluation/generation/agg.4b284b84bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_5.json new file mode 100644 index 0000000000000000000000000000000000000000..5a756c75d94db0ae2220e3d4b124a52902a222e8 --- /dev/null +++ b/4b284b84bc4seed4/evaluation/generation/agg.4b284b84bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 12.476649044527553, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.1698766854636743}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.4839633098425305, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.003299267823766779}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4705499697275458, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002738242144292685}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.45208098619239717, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002213005671732147}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.24091846485732277, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0025436868155710828}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.2320394354997667, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0022071751737241835}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.22264024747277225, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001987296116486491}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.3629543396997906, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0028393546604920366}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.35264832664365503, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0024261289166555506}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.3385274428827769, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0020319683310434395}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.4137754251875113, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003126258632288186}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.40238964616699796, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002661265077082012}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.38655176446890444, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0022484585467573517}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed4/evaluation/generation/agg.4b284b84bc4seed4_gem_xsum_article_DOC_summary_0.json b/4b284b84bc4seed4/evaluation/generation/agg.4b284b84bc4seed4_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..797881b0edaa893036964a2d78e66e95fbdc44e7 --- /dev/null +++ b/4b284b84bc4seed4/evaluation/generation/agg.4b284b84bc4seed4_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.15896903592047174, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002308498075214904}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.32151606833527474, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004467750436406024}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.20307234782166939, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.00254398638712588}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.03326326936108637, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0013115215791441866}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.07276812864417066, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.00266495974490086}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.043691698777011345, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0015720363515098195}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.12182880371774332, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001818918777245228}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.24834119210557543, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0035628091512773206}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.15593841528849953, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0019887757192407814}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.1227952289626782, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0018764392535370118}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.2516810661517101, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0038501177791414915}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.15748185679405513, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002117052212384048}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.9125252340175696, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.0939254181938478}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed4/evaluation/generation/agg.4b284b84bc4seed4_gem_xsum_article_DOC_summary_1.json b/4b284b84bc4seed4/evaluation/generation/agg.4b284b84bc4seed4_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..dcebbd72ca71b028aec4f1d7655fdcc4cace52c0 --- /dev/null +++ b/4b284b84bc4seed4/evaluation/generation/agg.4b284b84bc4seed4_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.12456796192309169, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0018663225428676555}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.3033782811263302, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.00435632341852972}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.17438840171489733, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002516782211263018}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.026297340000885697, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.001027838408615643}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.06688789749645495, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0027125026315894404}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.03725757946128431, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001453910826534785}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.10198505059076171, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0014701582863370355}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.2506401563563098, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.003651091960508788}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.14307994211588798, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.002005379862853747}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.09637711275571659, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0015128974074199704}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.23772290217746403, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0037666734496558294}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.1353866489423388, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0020762039106271024}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.4234140719501784, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.08008244099582335}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed4/evaluation/generation/agg.4b284b84bc4seed4_gem_xsum_article_DOC_summary_2.json b/4b284b84bc4seed4/evaluation/generation/agg.4b284b84bc4seed4_gem_xsum_article_DOC_summary_2.json new file mode 100644 index 0000000000000000000000000000000000000000..1b638867518df2a9de03f51108162eb8cdc26991 --- /dev/null +++ b/4b284b84bc4seed4/evaluation/generation/agg.4b284b84bc4seed4_gem_xsum_article_DOC_summary_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.12257166429044594, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0017758091493012137}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.2978206183170451, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004153358896452572}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.17150651760394497, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0023907265926706956}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.02653075423531747, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0010100537686758024}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.06731490725572081, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002670773143935172}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.03757086142902083, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0014307603878365935}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.10424146003543594, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001484600288621153}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.25471602692648093, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.003610349405448802}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.14604747569954757, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0020129836183947333}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.09373790710180954, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0014469445596197233}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.23028725682485185, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0035926993484314182}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.13155136268487863, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0019833919805789246}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.403058154138598, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.07947986565662277}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed4/evaluation/generation/agg.4b284b84bc4seed4_gem_xsum_article_DOC_summary_3.json b/4b284b84bc4seed4/evaluation/generation/agg.4b284b84bc4seed4_gem_xsum_article_DOC_summary_3.json new file mode 100644 index 0000000000000000000000000000000000000000..3fce67fc86852b8429e03378c782c60de04df736 --- /dev/null +++ b/4b284b84bc4seed4/evaluation/generation/agg.4b284b84bc4seed4_gem_xsum_article_DOC_summary_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.12212159195548629, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0020413508418911223}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.28379290430795073, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004300429318890937}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.1664704853916206, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.00250451940953418}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.027086922588921557, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0010893085545950853}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.06560470949712288, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0025928364606295586}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.037348548046976356, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0014490141107738803}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.10394812833382235, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0017256599090190122}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.24318873056030976, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0037594406422229213}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.14204750890662055, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0021403616377412287}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.09419477661930503, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0016768519118452933}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.22033465049587264, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.003618847956030538}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.12846242652343276, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0020450420326324982}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.4860485963618193, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.09363961497980915}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed4/evaluation/generation/agg.4b284b84bc4seed4_gem_xsum_article_DOC_summary_4.json b/4b284b84bc4seed4/evaluation/generation/agg.4b284b84bc4seed4_gem_xsum_article_DOC_summary_4.json new file mode 100644 index 0000000000000000000000000000000000000000..9a0d2d5ea0750ff7db80a6f0e69adfeaf58e849d --- /dev/null +++ b/4b284b84bc4seed4/evaluation/generation/agg.4b284b84bc4seed4_gem_xsum_article_DOC_summary_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.041843850057486254, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0027248704585387203}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.07170804112417602, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0041857327071730364}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.047356647789818455, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002748168768611129}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.00975684909437077, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0010812973230085907}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.016640859698859974, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0015451158301785048}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.010923150617633553, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001018598314862772}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.03544031461665562, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002305692160527795}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.06079313428910594, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0035266276653790293}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.03990722372366724, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.002276301239159138}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.03328647749360134, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0022740307934491265}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.0556921853671952, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.003318230068428034}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.036847659155334334, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0021765624675524546}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 0.8326562560108917, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.1467525734431667}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed4/evaluation/generation/agg.4b284b84bc4seed4_gem_xsum_article_DOC_summary_5.json b/4b284b84bc4seed4/evaluation/generation/agg.4b284b84bc4seed4_gem_xsum_article_DOC_summary_5.json new file mode 100644 index 0000000000000000000000000000000000000000..ac4b71d0faed48b00feff4e0c6c3b0771ac9bbda --- /dev/null +++ b/4b284b84bc4seed4/evaluation/generation/agg.4b284b84bc4seed4_gem_xsum_article_DOC_summary_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.003243188732265197, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0009910456520478602}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.0026536470502779067, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0007340423451228517}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.0028438767697741185, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0008091353860408605}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.0007579961658762991, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0004164644743745851}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.0005294862370334068, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.00028364001336350907}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.0006098723079855157, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0003241318837354033}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.002549580362974837, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0007512133719590526}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.0021600686497647045, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0006036544336792427}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.0022743929327468044, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0006386166431455819}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.0028617335261268903, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0008958933741864754}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.0023705346379101037, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0006744765626606669}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.0025220053356973726, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0007351598994991656}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 5.230211901475508e-35, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 5.134007383899523e-30}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_GEM-web_nlg_en_PALM_prompt_0.jsonl b/4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_GEM-web_nlg_en_PALM_prompt_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..342b869c1d8338feb99ff12003c0f31a75a97213 --- /dev/null +++ b/4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_GEM-web_nlg_en_PALM_prompt_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59bd870aa312bd8247bfeae14906646197c6c9cd0a310e07cacd6b7a138e03a5 +size 4141530 diff --git a/4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_GEM-web_nlg_en_PALM_prompt_1.jsonl b/4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_GEM-web_nlg_en_PALM_prompt_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..323aa9d689f8288f8f0689b0697d3002e90c8ea3 --- /dev/null +++ b/4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_GEM-web_nlg_en_PALM_prompt_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8fd20ecb2bd0b599da2f54db28d5fd12418312b349cf4d83896f26cb3291309f +size 5114616 diff --git a/4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_GEM-web_nlg_en_PALM_prompt_2.jsonl b/4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_GEM-web_nlg_en_PALM_prompt_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..7dce6db54f760dcefe713772fd9e192efc57d5f8 --- /dev/null +++ b/4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_GEM-web_nlg_en_PALM_prompt_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19e0b79843fef2af26c6f1ce9558d0775e164d18e7049ca64ffb293bd7b4150f +size 6026069 diff --git a/4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_GEM-web_nlg_en_PALM_prompt_3.jsonl b/4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_GEM-web_nlg_en_PALM_prompt_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..857e2c0162df4d06affbf0cd6495c9023f032c3e --- /dev/null +++ b/4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_GEM-web_nlg_en_PALM_prompt_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24393b3e3a598781aacb9172798fda8880250d9f35c9d9bbe71d890a6cd05855 +size 6941735 diff --git a/4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_GEM-web_nlg_en_PALM_prompt_4.jsonl b/4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_GEM-web_nlg_en_PALM_prompt_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..25edcddee02e139b098237c95d18f93493e7e28e --- /dev/null +++ b/4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_GEM-web_nlg_en_PALM_prompt_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:176c0e3356ac46316d46fee41f02d0ce96a2c006be1ff2b633fdf8c08e29df0b +size 7842382 diff --git a/4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_GEM-web_nlg_en_PALM_prompt_5.jsonl b/4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_GEM-web_nlg_en_PALM_prompt_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..46adff44708423850069fd3087c7c85a9f46d359 --- /dev/null +++ b/4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_GEM-web_nlg_en_PALM_prompt_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a8857ea8ca12604f51179490c09e89d3d34820dd159d8677b3455b05c31c7e7 +size 8760072 diff --git a/4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_GEM-wiki_lingua_en_tldr_en_0.jsonl b/4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_GEM-wiki_lingua_en_tldr_en_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..1f3bcc6e6e4cd23d9a2768ba48ad6d604ec7cd49 --- /dev/null +++ b/4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_GEM-wiki_lingua_en_tldr_en_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a8a035f0cba2cb92a97bbd6bf487419bfd8507ffe3be53225ec91ff9f3c0941 +size 7698807 diff --git a/4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_GEM-wiki_lingua_en_tldr_en_1.jsonl b/4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_GEM-wiki_lingua_en_tldr_en_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..b0d5ace536fcaac9a1d0971d6b68af543f22626f --- /dev/null +++ b/4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_GEM-wiki_lingua_en_tldr_en_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8057ee80732a3259b3c9ec385cd5bb9270356bf47b85e288d49860cd9c62dd5d +size 13294750 diff --git a/4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_GEM-wiki_lingua_en_tldr_en_2.jsonl b/4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_GEM-wiki_lingua_en_tldr_en_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..6ed33c39e99d0aaa351a42734917b15a8308eb99 --- /dev/null +++ b/4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_GEM-wiki_lingua_en_tldr_en_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b39ae725d2b79314df120bcd1b08074cf44d69b49999c87d3fefa4ab1ae5b5ef +size 18923084 diff --git a/4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_GEM-wiki_lingua_en_tldr_en_3.jsonl b/4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_GEM-wiki_lingua_en_tldr_en_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..8f98d4bddfcb28a521fe9ed822bde591490d17a7 --- /dev/null +++ b/4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_GEM-wiki_lingua_en_tldr_en_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63c93fb8aa70eefeee7b407a0a172356711e12ce7db25aa81cdd05d112da8849 +size 24345273 diff --git a/4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_GEM-wiki_lingua_en_tldr_en_4.jsonl b/4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_GEM-wiki_lingua_en_tldr_en_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..2ec44286fd5f09d9d2b8a555bbbee6d3c7f7b38a --- /dev/null +++ b/4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_GEM-wiki_lingua_en_tldr_en_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4c7936ad16b6693369edc6e348e3c2e85762fe3a581a4a1e7817f030b50a3f0 +size 29479723 diff --git a/4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_GEM-wiki_lingua_en_tldr_en_5.jsonl b/4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_GEM-wiki_lingua_en_tldr_en_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..4e41830ee09f19274bc73551c50a3be95a0f15f7 --- /dev/null +++ b/4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_GEM-wiki_lingua_en_tldr_en_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b234e7ddd3503bd4922a158874c82090047615e30ecc7a5c6f67c352ed53f3e +size 34800879 diff --git a/4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl b/4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..61ce65fa5a342bd74dac433bade7b27eda932ca5 --- /dev/null +++ b/4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc669013ad3008b3f21c25437e22d1ebcd597037fc7f27ab0d0785ca7caab721 +size 3955030 diff --git a/4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl b/4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..6716502c3d4f7c14ddb0e97e6ee82ad126f2fefe --- /dev/null +++ b/4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e14fb7f875b83bf041fbe40f4f9524a0b9660df9652156fcefaa5e371a9c0c9 +size 5172751 diff --git a/4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl b/4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..fefc646aa86675a74d6c4bbd2efc4b9e3b3c6374 --- /dev/null +++ b/4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3cca5939887f9e174c59bdcb54c66295d7f08da28af309eaa8e697af0971dc31 +size 6192641 diff --git a/4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl b/4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..25c69c974d645764a465ad7f82d9ae06d23ec9f6 --- /dev/null +++ b/4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6296d5fcf3e2eaaab40269fe2edc65c30f08c3fb7bb6db818a1d08ad83bed737 +size 7277111 diff --git a/4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl b/4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..70305a1663023733692f6fac4d8ed11f6ba83b4d --- /dev/null +++ b/4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d97e42cdee6ca3d40eb7c28c6e685a2b9eb45ef46f550c7c9ca3fe0a144e163 +size 8365677 diff --git a/4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl b/4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..8ce813b6e1d6ce53e403697b848fcf1094837cfe --- /dev/null +++ b/4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a85e40c267ad0ff8e5eed95858c7f1533a1fbe9b052cd1c6c6c6cc101de4c98 +size 9463778 diff --git a/4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_gem_xsum_article_DOC_summary_0.jsonl b/4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_gem_xsum_article_DOC_summary_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..430c3968e7d9d24828ba4f4b656128dd4da6a69a --- /dev/null +++ b/4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_gem_xsum_article_DOC_summary_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b4fdb64cf160d3e167455a6537e82115067ecd47de963063afd4b3103fd1ca6 +size 2794519 diff --git a/4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_gem_xsum_article_DOC_summary_1.jsonl b/4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_gem_xsum_article_DOC_summary_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e25e42607b72b161e9850022524390bd5eaa7b4e --- /dev/null +++ b/4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_gem_xsum_article_DOC_summary_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8904902ea188c582ea1e458b91816b52676715e8bddf80e2c1cdf1ae73bfc54c +size 5104420 diff --git a/4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_gem_xsum_article_DOC_summary_2.jsonl b/4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_gem_xsum_article_DOC_summary_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..56fd61c49f4bd9482dde23b02e333f781ab0dd19 --- /dev/null +++ b/4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_gem_xsum_article_DOC_summary_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d256f0de853321b4b094fbe71535ceb65b9fbc6404c5cfdb70d9e9405feb20c +size 7378216 diff --git a/4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_gem_xsum_article_DOC_summary_3.jsonl b/4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_gem_xsum_article_DOC_summary_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..f9e23ee82d970a8ad293d2917a833339786916a5 --- /dev/null +++ b/4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_gem_xsum_article_DOC_summary_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ac4b382e838c57d8748317abbaf3412b5f27054b775efde1d3d3c356b0e6e29 +size 9647607 diff --git a/4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_gem_xsum_article_DOC_summary_4.jsonl b/4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_gem_xsum_article_DOC_summary_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..b4eea031a9097c5f97b7dccf2afae1d10a2a379b --- /dev/null +++ b/4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_gem_xsum_article_DOC_summary_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f09a93905009b0ee28a078aee66e6e2502fe73387f1659ade3293573f4d3ca63 +size 11672483 diff --git a/4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_gem_xsum_article_DOC_summary_5.jsonl b/4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_gem_xsum_article_DOC_summary_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..5f2383a612297ac9312c3f30fc444e1e1bec6f74 --- /dev/null +++ b/4b284b84bc4seed4/evaluation/generation/examples.4b284b84bc4seed4_gem_xsum_article_DOC_summary_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cae11310c58316710ba0957bc2f86e68d98e03f47c7ddd0e55615a7adb628c69 +size 13897515 diff --git a/4b284b84bc4seed4/evaluation/generation/merged.csv b/4b284b84bc4seed4/evaluation/generation/merged.csv new file mode 100644 index 0000000000000000000000000000000000000000..fd1ee3ca9265d8fc36d0558911b623df7a99ca11 --- /dev/null +++ b/4b284b84bc4seed4/evaluation/generation/merged.csv @@ -0,0 +1,53 @@ +dataset,fewshots,prompt,metric,value +e2e_nlg_cleaned,0,generate_text_restaurant,rouge2_fmeasure,0.007854709999230764 +e2e_nlg_cleaned,0,median,rouge2_fmeasure,0.007854709999230764 +e2e_nlg_cleaned,1,generate_text_restaurant,rouge2_fmeasure,0.17753845874321364 +e2e_nlg_cleaned,1,median,rouge2_fmeasure,0.17753845874321364 +e2e_nlg_cleaned,2,generate_text_restaurant,rouge2_fmeasure,0.21441790403427352 +e2e_nlg_cleaned,2,median,rouge2_fmeasure,0.21441790403427352 +e2e_nlg_cleaned,3,generate_text_restaurant,rouge2_fmeasure,0.2242096802521301 +e2e_nlg_cleaned,3,median,rouge2_fmeasure,0.2242096802521301 +e2e_nlg_cleaned,4,generate_text_restaurant,rouge2_fmeasure,0.22808412145632054 +e2e_nlg_cleaned,4,median,rouge2_fmeasure,0.22808412145632054 +e2e_nlg_cleaned,5,generate_text_restaurant,rouge2_fmeasure,0.22264024747277225 +e2e_nlg_cleaned,5,median,rouge2_fmeasure,0.22264024747277225 +e2e_nlg_cleaned,5,average,multiple,0.17912418699299013 +gem_xsum,0,article_DOC_summary,rouge2_fmeasure,0.043691698777011345 +gem_xsum,0,median,rouge2_fmeasure,0.043691698777011345 +gem_xsum,1,article_DOC_summary,rouge2_fmeasure,0.03725757946128431 +gem_xsum,1,median,rouge2_fmeasure,0.03725757946128431 +gem_xsum,2,article_DOC_summary,rouge2_fmeasure,0.03757086142902083 +gem_xsum,2,median,rouge2_fmeasure,0.03757086142902083 +gem_xsum,3,article_DOC_summary,rouge2_fmeasure,0.037348548046976356 +gem_xsum,3,median,rouge2_fmeasure,0.037348548046976356 +gem_xsum,4,article_DOC_summary,rouge2_fmeasure,0.010923150617633553 +gem_xsum,4,median,rouge2_fmeasure,0.010923150617633553 +gem_xsum,5,article_DOC_summary,rouge2_fmeasure,0.0006098723079855157 +gem_xsum,5,median,rouge2_fmeasure,0.0006098723079855157 +gem_xsum,5,average,multiple,0.027900285106651986 +web_nlg_en,0,PALM_prompt,rouge2_fmeasure,0.050108480283474685 +web_nlg_en,0,median,rouge2_fmeasure,0.050108480283474685 +web_nlg_en,1,PALM_prompt,rouge2_fmeasure,0.05255280813689339 +web_nlg_en,1,median,rouge2_fmeasure,0.05255280813689339 +web_nlg_en,2,PALM_prompt,rouge2_fmeasure,0.05396475791939589 +web_nlg_en,2,median,rouge2_fmeasure,0.05396475791939589 +web_nlg_en,3,PALM_prompt,rouge2_fmeasure,0.05374249345557979 +web_nlg_en,3,median,rouge2_fmeasure,0.05374249345557979 +web_nlg_en,4,PALM_prompt,rouge2_fmeasure,0.05567978816710457 +web_nlg_en,4,median,rouge2_fmeasure,0.05567978816710457 +web_nlg_en,5,PALM_prompt,rouge2_fmeasure,0.05592752125205284 +web_nlg_en,5,median,rouge2_fmeasure,0.05592752125205284 +web_nlg_en,5,average,multiple,0.05366264153575019 +wiki_lingua_en,0,tldr_en,rouge2_fmeasure,0.0358183863771304 +wiki_lingua_en,0,median,rouge2_fmeasure,0.0358183863771304 +wiki_lingua_en,1,tldr_en,rouge2_fmeasure,0.061675743964392724 +wiki_lingua_en,1,median,rouge2_fmeasure,0.061675743964392724 +wiki_lingua_en,2,tldr_en,rouge2_fmeasure,0.06423744493296574 +wiki_lingua_en,2,median,rouge2_fmeasure,0.06423744493296574 +wiki_lingua_en,3,tldr_en,rouge2_fmeasure,0.05098365238098847 +wiki_lingua_en,3,median,rouge2_fmeasure,0.05098365238098847 +wiki_lingua_en,4,tldr_en,rouge2_fmeasure,0.01571321711438463 +wiki_lingua_en,4,median,rouge2_fmeasure,0.01571321711438463 +wiki_lingua_en,5,tldr_en,rouge2_fmeasure,0.002509211412713389 +wiki_lingua_en,5,median,rouge2_fmeasure,0.002509211412713389 +wiki_lingua_en,5,average,multiple,0.038489609363762556 diff --git a/4b284b84bc4seed4/evaluation/generation/merged.json b/4b284b84bc4seed4/evaluation/generation/merged.json new file mode 100644 index 0000000000000000000000000000000000000000..b90d0662412c31db5bd00e10bd69fea1e67b601e --- /dev/null +++ b/4b284b84bc4seed4/evaluation/generation/merged.json @@ -0,0 +1 @@ +{"GEM/web_nlg_en": {"0": {"PALM_prompt": {"bleu": 0.3523277002277804, "bleu_stderr": 0.03261401734869028, "rouge1_fmeasure": 0.10590846249521367, "rouge1_fmeasure_stderr": 0.0020195315762052673, "rouge1_precision": 0.07140357303785742, "rouge1_precision_stderr": 0.0017735064753741127, "rouge1_recall": 0.2938068811232804, "rouge1_recall_stderr": 0.004698591443703581, "rouge2_fmeasure": 0.050108480283474685, "rouge2_fmeasure_stderr": 0.0012479824947943812, "rouge2_precision": 0.033440949253294806, "rouge2_precision_stderr": 0.001066168691596413, "rouge2_recall": 0.14239106266330545, "rouge2_recall_stderr": 0.003163086494032039, "rougeL_fmeasure": 0.10246592063839631, "rougeL_fmeasure_stderr": 0.0018904079137483055, "rougeL_precision": 0.06888442229810386, "rougeL_precision_stderr": 0.001675844279268184, "rougeL_recall": 0.2866580974880424, "rougeL_recall_stderr": 0.004577594263202556, "rougeLsum_fmeasure": 0.10120297741035127, "rougeLsum_fmeasure_stderr": 0.0018969772318448463, "rougeLsum_precision": 0.06827936311686421, "rougeLsum_precision_stderr": 0.001698555616698455, "rougeLsum_recall": 0.28107278592336027, "rougeLsum_recall_stderr": 0.004438130822299941}}, "1": {"PALM_prompt": {"bleu": 0.4351779771917347, "bleu_stderr": 0.03461044967042056, "rouge1_fmeasure": 0.11195633719029822, "rouge1_fmeasure_stderr": 0.0017956976300324953, "rouge1_precision": 0.07162194662437592, "rouge1_precision_stderr": 0.0013087409774892172, "rouge1_recall": 0.3606308247426329, "rouge1_recall_stderr": 0.005204874863706004, "rouge2_fmeasure": 0.05255280813689339, "rouge2_fmeasure_stderr": 0.0011567693373819863, "rouge2_precision": 0.03355406237669093, "rouge2_precision_stderr": 0.0008232466042918183, "rouge2_recall": 0.17649806895632947, "rouge2_recall_stderr": 0.003573445474921975, "rougeL_fmeasure": 0.10647953810824176, "rougeL_fmeasure_stderr": 0.0016760663905838954, "rougeL_precision": 0.06810242914702684, "rougeL_precision_stderr": 0.0012110333378022905, "rougeL_recall": 0.34048847512021524, "rougeL_recall_stderr": 0.004750749477340653, "rougeLsum_fmeasure": 0.10693711806502432, "rougeLsum_fmeasure_stderr": 0.0017046988764721166, "rougeLsum_precision": 0.06848895184352013, "rougeLsum_precision_stderr": 0.0012480162482644015, "rougeLsum_recall": 0.3429613098536967, "rougeLsum_recall_stderr": 0.004820988766109633}}, "2": {"PALM_prompt": {"bleu": 0.4447149214180348, "bleu_stderr": 0.018972548555560714, "rouge1_fmeasure": 0.11462405866857102, "rouge1_fmeasure_stderr": 0.001736014539262953, "rouge1_precision": 0.07269992209256788, "rouge1_precision_stderr": 0.0012516992696440586, "rouge1_recall": 0.3753121304840736, "rouge1_recall_stderr": 0.0050439493858917194, "rouge2_fmeasure": 0.05396475791939589, "rouge2_fmeasure_stderr": 0.001107305452781615, "rouge2_precision": 0.03404844764438817, "rouge2_precision_stderr": 0.0007680445086395626, "rouge2_recall": 0.1879602254006144, "rouge2_recall_stderr": 0.003710463717182471, "rougeL_fmeasure": 0.10775063055928252, "rougeL_fmeasure_stderr": 0.0015887580065971389, "rougeL_precision": 0.06834435101252613, "rougeL_precision_stderr": 0.0011410779513936623, "rougeL_recall": 0.350761541750936, "rougeL_recall_stderr": 0.0045336528849166365, "rougeLsum_fmeasure": 0.10926127364577738, "rougeLsum_fmeasure_stderr": 0.0016390081021653892, "rougeLsum_precision": 0.06935895852997251, "rougeLsum_precision_stderr": 0.0011852302620070257, "rougeLsum_recall": 0.3565184552784119, "rougeLsum_recall_stderr": 0.004687409183137695}}, "3": {"PALM_prompt": {"bleu": 0.5087674664658492, "bleu_stderr": 0.026893638286752154, "rouge1_fmeasure": 0.11467972816113098, "rouge1_fmeasure_stderr": 0.001673200203783686, "rouge1_precision": 0.072497531691811, "rouge1_precision_stderr": 0.0012026919993320111, "rouge1_recall": 0.38474435436270493, "rouge1_recall_stderr": 0.005142183312772921, "rouge2_fmeasure": 0.05374249345557979, "rouge2_fmeasure_stderr": 0.0010894570854945713, "rouge2_precision": 0.03380876275906201, "rouge2_precision_stderr": 0.0007518942865145289, "rouge2_recall": 0.19155642039509754, "rouge2_recall_stderr": 0.0037517387263905507, "rougeL_fmeasure": 0.10704454572486424, "rougeL_fmeasure_stderr": 0.0015340338132748832, "rougeL_precision": 0.06774922502819766, "rougeL_precision_stderr": 0.0011043288246760676, "rougeL_recall": 0.355788174091109, "rougeL_recall_stderr": 0.004543365107062434, "rougeLsum_fmeasure": 0.10908169881982438, "rougeLsum_fmeasure_stderr": 0.0015837111282973452, "rougeLsum_precision": 0.06899862406820627, "rougeLsum_precision_stderr": 0.0011409968694109725, "rougeLsum_recall": 0.36454854774413287, "rougeLsum_recall_stderr": 0.004741615558398587}}, "4": {"PALM_prompt": {"bleu": 0.5913746773860721, "bleu_stderr": 0.041085758656651254, "rouge1_fmeasure": 0.11862510680315241, "rouge1_fmeasure_stderr": 0.0016779930474832658, "rouge1_precision": 0.07471728852529957, "rouge1_precision_stderr": 0.00120444126407064, "rouge1_recall": 0.4024992804481891, "rouge1_recall_stderr": 0.005245342121017829, "rouge2_fmeasure": 0.05567978816710457, "rouge2_fmeasure_stderr": 0.0010718834740964826, "rouge2_precision": 0.0348700360833608, "rouge2_precision_stderr": 0.0007408153164874413, "rouge2_recall": 0.2036124062513765, "rouge2_recall_stderr": 0.00387597600568855, "rougeL_fmeasure": 0.10913463867270404, "rougeL_fmeasure_stderr": 0.0015113181951666658, "rougeL_precision": 0.06888490676353087, "rougeL_precision_stderr": 0.0010959048971556757, "rougeL_recall": 0.3672784960986926, "rougeL_recall_stderr": 0.004566861844635672, "rougeLsum_fmeasure": 0.11255292648692071, "rougeLsum_fmeasure_stderr": 0.0015868430386374208, "rougeLsum_precision": 0.07096869733176525, "rougeLsum_precision_stderr": 0.0011452901218571788, "rougeLsum_recall": 0.3804621853389486, "rougeLsum_recall_stderr": 0.00482918129805665}}, "5": {"PALM_prompt": {"bleu": 0.6304604966593631, "bleu_stderr": 0.03484982021747957, "rouge1_fmeasure": 0.11884850755997649, "rouge1_fmeasure_stderr": 0.001616705319256009, "rouge1_precision": 0.0744328271529154, "rouge1_precision_stderr": 0.001157549734274375, "rouge1_recall": 0.4127612356762462, "rouge1_recall_stderr": 0.0052523273943021025, "rouge2_fmeasure": 0.05592752125205284, "rouge2_fmeasure_stderr": 0.0010528579472296477, "rouge2_precision": 0.03482016206562085, "rouge2_precision_stderr": 0.0007258016003322981, "rouge2_recall": 0.20894584695108945, "rouge2_recall_stderr": 0.0038600278798887723, "rougeL_fmeasure": 0.1090677963632186, "rougeL_fmeasure_stderr": 0.0014765997700889857, "rougeL_precision": 0.0684803394428656, "rougeL_precision_stderr": 0.0010698339353882353, "rougeL_recall": 0.3750129978505135, "rougeL_recall_stderr": 0.004543607982881679, "rougeLsum_fmeasure": 0.11288876880831, "rougeLsum_fmeasure_stderr": 0.0015402308170382386, "rougeLsum_precision": 0.07077155348314326, "rougeLsum_precision_stderr": 0.0011076088583072189, "rougeLsum_recall": 0.3900673103247878, "rougeLsum_recall_stderr": 0.0048425468419916184}}}, "GEM/wiki_lingua_en": {"0": {"tldr_en": {"bleu": 1.5421125542141876, "bleu_stderr": 0.05756547176107712, "rouge1_fmeasure": 0.17708913864416292, "rouge1_fmeasure_stderr": 0.0018212193534322709, "rouge1_precision": 0.15130222816102726, "rouge1_precision_stderr": 0.0018641353605878376, "rouge1_recall": 0.2585048040019072, "rouge1_recall_stderr": 0.0026633037296359954, "rouge2_fmeasure": 0.0358183863771304, "rouge2_fmeasure_stderr": 0.00084133860800268, "rouge2_precision": 0.030354095195740356, "rouge2_precision_stderr": 0.0007454497776331851, "rouge2_recall": 0.05433811946884532, "rouge2_recall_stderr": 0.0014397669916064314, "rougeL_fmeasure": 0.1395967400507796, "rougeL_fmeasure_stderr": 0.001313393024815337, "rougeL_precision": 0.11775252929311998, "rougeL_precision_stderr": 0.0013049047450472628, "rougeL_recall": 0.20864111880992672, "rougeL_recall_stderr": 0.002169509233782621, "rougeLsum_fmeasure": 0.16174636673799278, "rougeLsum_fmeasure_stderr": 0.0016649134344973989, "rougeLsum_precision": 0.13805300047109062, "rougeLsum_precision_stderr": 0.0017010449743815584, "rougeLsum_recall": 0.23676218222386985, "rougeLsum_recall_stderr": 0.002462862595699301}}, "1": {"tldr_en": {"bleu": 3.1118566247604162, "bleu_stderr": 0.062088508469292286, "rouge1_fmeasure": 0.23390150161377168, "rouge1_fmeasure_stderr": 0.0020117545140889465, "rouge1_precision": 0.2194647051475106, "rouge1_precision_stderr": 0.0026637127905829957, "rouge1_recall": 0.32953538987527364, "rouge1_recall_stderr": 0.0029752735913270213, "rouge2_fmeasure": 0.061675743964392724, "rouge2_fmeasure_stderr": 0.0011660228294911223, "rouge2_precision": 0.060079962682567656, "rouge2_precision_stderr": 0.0015430426704356244, "rouge2_recall": 0.08864081298208347, "rouge2_recall_stderr": 0.0018541652458318118, "rougeL_fmeasure": 0.1623726890739185, "rougeL_fmeasure_stderr": 0.0013550604960878186, "rougeL_precision": 0.1539694016100103, "rougeL_precision_stderr": 0.0020721550784059055, "rougeL_recall": 0.23350379059815546, "rougeL_recall_stderr": 0.002302352375151091, "rougeLsum_fmeasure": 0.21928618412182982, "rougeLsum_fmeasure_stderr": 0.0018889547156816118, "rougeLsum_precision": 0.20602533584010463, "rougeLsum_precision_stderr": 0.00254117072503622, "rougeLsum_recall": 0.30941435638814363, "rougeLsum_recall_stderr": 0.0028218530563501962}}, "2": {"tldr_en": {"bleu": 3.3250803512114917, "bleu_stderr": 0.043720151005010505, "rouge1_fmeasure": 0.23819401638529333, "rouge1_fmeasure_stderr": 0.001961472755718473, "rouge1_precision": 0.21230058363878315, "rouge1_precision_stderr": 0.0024080619207750963, "rouge1_recall": 0.34134579643295393, "rouge1_recall_stderr": 0.00287291808958866, "rouge2_fmeasure": 0.06423744493296574, "rouge2_fmeasure_stderr": 0.0011237343652403928, "rouge2_precision": 0.058180340769663996, "rouge2_precision_stderr": 0.0012366998672630046, "rouge2_recall": 0.09448704160727436, "rouge2_recall_stderr": 0.0018410055564769775, "rougeL_fmeasure": 0.16572553377575022, "rougeL_fmeasure_stderr": 0.0013269375688079502, "rougeL_precision": 0.14716839436847945, "rougeL_precision_stderr": 0.001723324637255188, "rougeL_recall": 0.24371061167078392, "rougeL_recall_stderr": 0.002305940409051167, "rougeLsum_fmeasure": 0.22428067952847994, "rougeLsum_fmeasure_stderr": 0.001853122562183745, "rougeLsum_precision": 0.19985650365773666, "rougeLsum_precision_stderr": 0.0022791002962553927, "rougeLsum_recall": 0.32205265894357177, "rougeLsum_recall_stderr": 0.0027492000000614377}}, "3": {"tldr_en": {"bleu": 3.264795684563816, "bleu_stderr": 0.0665539830427249, "rouge1_fmeasure": 0.19371662716809854, "rouge1_fmeasure_stderr": 0.002332163732000944, "rouge1_precision": 0.1759676944241637, "rouge1_precision_stderr": 0.002599503777933057, "rouge1_recall": 0.2783528249629676, "rouge1_recall_stderr": 0.003439775464191638, "rouge2_fmeasure": 0.05098365238098847, "rouge2_fmeasure_stderr": 0.0010739239370527816, "rouge2_precision": 0.04672040323211839, "rouge2_precision_stderr": 0.0011635414202250617, "rouge2_recall": 0.07600165390612795, "rouge2_recall_stderr": 0.0018062659171568973, "rougeL_fmeasure": 0.13757683764937148, "rougeL_fmeasure_stderr": 0.0016125055112952101, "rougeL_precision": 0.12481870305727255, "rougeL_precision_stderr": 0.0018681974052869646, "rougeL_recall": 0.2032107116074926, "rougeL_recall_stderr": 0.0026995788494260085, "rougeLsum_fmeasure": 0.18265210486261796, "rougeLsum_fmeasure_stderr": 0.002199082319355358, "rougeLsum_precision": 0.165693431417505, "rougeLsum_precision_stderr": 0.0024409611879563638, "rougeLsum_recall": 0.26318808414968303, "rougeLsum_recall_stderr": 0.0032807386039732994}}, "4": {"tldr_en": {"bleu": 0.7399731218010301, "bleu_stderr": 0.05315913015718361, "rouge1_fmeasure": 0.061810069279221835, "rouge1_fmeasure_stderr": 0.002050884974045622, "rouge1_precision": 0.05753559661305722, "rouge1_precision_stderr": 0.002138715660683914, "rouge1_recall": 0.0930047418871661, "rouge1_recall_stderr": 0.0031434712495670048, "rouge2_fmeasure": 0.01571321711438463, "rouge2_fmeasure_stderr": 0.000725772297710108, "rouge2_precision": 0.014474681217716064, "rouge2_precision_stderr": 0.0008323203723133832, "rouge2_recall": 0.025504176001051017, "rouge2_recall_stderr": 0.001303289046442984, "rougeL_fmeasure": 0.04536102247912932, "rougeL_fmeasure_stderr": 0.001487864376367666, "rougeL_precision": 0.042660119298722994, "rougeL_precision_stderr": 0.0016477900120572672, "rougeL_recall": 0.06969950422653938, "rougeL_recall_stderr": 0.0024116366945608377, "rougeLsum_fmeasure": 0.058117132916654005, "rougeLsum_fmeasure_stderr": 0.0019249371066501861, "rougeLsum_precision": 0.05421281196909096, "rougeLsum_precision_stderr": 0.002025499714973123, "rougeLsum_recall": 0.08758632873317065, "rougeLsum_recall_stderr": 0.0029650946931968555}}, "5": {"tldr_en": {"bleu": 1.7124193494262821e-06, "bleu_stderr": 3.2741945230754847e-06, "rouge1_fmeasure": 0.009774296059399336, "rouge1_fmeasure_stderr": 0.0009080621408899851, "rouge1_precision": 0.009165990245767591, "rouge1_precision_stderr": 0.0009442979407312777, "rouge1_recall": 0.015418596799201417, "rouge1_recall_stderr": 0.0015077442548408681, "rouge2_fmeasure": 0.002509211412713389, "rouge2_fmeasure_stderr": 0.0003022299477574736, "rouge2_precision": 0.0023451269499108907, "rouge2_precision_stderr": 0.00034470873041317335, "rouge2_recall": 0.0046018834347627035, "rouge2_recall_stderr": 0.0006803082985888496, "rougeL_fmeasure": 0.00720761001914484, "rougeL_fmeasure_stderr": 0.0006681163091531024, "rougeL_precision": 0.00678359535997039, "rougeL_precision_stderr": 0.0007097335601922828, "rougeL_recall": 0.011572236419649438, "rougeL_recall_stderr": 0.0011572136947999466, "rougeLsum_fmeasure": 0.00912075895864339, "rougeLsum_fmeasure_stderr": 0.0008473674103987658, "rougeLsum_precision": 0.008486993163393306, "rougeLsum_precision_stderr": 0.0008690259306885085, "rougeLsum_recall": 0.014459769727609291, "rougeLsum_recall_stderr": 0.0014158078041286931}}}, "e2e_nlg_cleaned": {"0": {"generate_text_restaurant": {"bleu": 0.05808891716691411, "bleu_stderr": 0.011333330592580656, "rouge1_fmeasure": 0.13899147577262666, "rouge1_fmeasure_stderr": 0.0009286294871679315, "rouge1_precision": 0.3023091414929599, "rouge1_precision_stderr": 0.002913887406749905, "rouge1_recall": 0.12238985523242189, "rouge1_recall_stderr": 0.0013610627775538216, "rouge2_fmeasure": 0.007854709999230764, "rouge2_fmeasure_stderr": 0.00036516539565493495, "rouge2_precision": 0.022775128205128368, "rouge2_precision_stderr": 0.0011384359586054489, "rouge2_recall": 0.00610855031631702, "rouge2_recall_stderr": 0.0002896485948013325, "rougeL_fmeasure": 0.1275827225198627, "rougeL_fmeasure_stderr": 0.0008841123038167355, "rougeL_precision": 0.2745392561803429, "rougeL_precision_stderr": 0.002727571611712019, "rougeL_recall": 0.11483479288312695, "rougeL_recall_stderr": 0.0013803318617414532, "rougeLsum_fmeasure": 0.12203235569838602, "rougeLsum_fmeasure_stderr": 0.0009202893055765295, "rougeLsum_precision": 0.27555523169576246, "rougeLsum_precision_stderr": 0.002926670520914391, "rougeLsum_recall": 0.1020509279394632, "rougeLsum_recall_stderr": 0.0009751330314082834}}, "1": {"generate_text_restaurant": {"bleu": 8.932841105621064, "bleu_stderr": 0.11441707444147597, "rouge1_fmeasure": 0.3974228957995462, "rouge1_fmeasure_stderr": 0.002320429553502724, "rouge1_precision": 0.44530595662757727, "rouge1_precision_stderr": 0.0036595275413873183, "rouge1_recall": 0.42827303768403047, "rouge1_recall_stderr": 0.0030343030656821836, "rouge2_fmeasure": 0.17753845874321364, "rouge2_fmeasure_stderr": 0.0018327497034708936, "rouge2_precision": 0.20230936163095836, "rouge2_precision_stderr": 0.0025036401909577727, "rouge2_recall": 0.19120188941717492, "rouge2_recall_stderr": 0.00210380636425424, "rougeL_fmeasure": 0.2971909218049089, "rougeL_fmeasure_stderr": 0.0018836069812237484, "rougeL_precision": 0.33275929259548276, "rougeL_precision_stderr": 0.00295993230865274, "rougeL_recall": 0.32342830006561096, "rougeL_recall_stderr": 0.002557175371249573, "rougeLsum_fmeasure": 0.3253556432256207, "rougeLsum_fmeasure_stderr": 0.0022142373615418754, "rougeLsum_precision": 0.36536808388203507, "rougeLsum_precision_stderr": 0.0033140674546694128, "rougeLsum_recall": 0.35017983210590575, "rougeLsum_recall_stderr": 0.0027753545840717682}}, "2": {"generate_text_restaurant": {"bleu": 11.880063105811095, "bleu_stderr": 0.17984450139554475, "rouge1_fmeasure": 0.44505676798399185, "rouge1_fmeasure_stderr": 0.0022811968446148742, "rouge1_precision": 0.506737464401302, "rouge1_precision_stderr": 0.0035936965647612898, "rouge1_recall": 0.45038732838216006, "rouge1_recall_stderr": 0.0028591739786909026, "rouge2_fmeasure": 0.21441790403427352, "rouge2_fmeasure_stderr": 0.0019873610836182685, "rouge2_precision": 0.24833021143506717, "rouge2_precision_stderr": 0.002726123256626373, "rouge2_recall": 0.2167301855181476, "rouge2_recall_stderr": 0.002197696079985957, "rougeL_fmeasure": 0.33281096535989263, "rougeL_fmeasure_stderr": 0.002027510114174692, "rougeL_precision": 0.37992704007005046, "rougeL_precision_stderr": 0.0030781300319706554, "rougeL_recall": 0.337552347296149, "rougeL_recall_stderr": 0.0024789904236623512, "rougeLsum_fmeasure": 0.3722406759710508, "rougeLsum_fmeasure_stderr": 0.002269175188375031, "rougeLsum_precision": 0.4242330670183315, "rougeLsum_precision_stderr": 0.0033488862052480383, "rougeLsum_recall": 0.3763581811094256, "rougeLsum_recall_stderr": 0.002695938632190225}}, "3": {"generate_text_restaurant": {"bleu": 12.520921591661882, "bleu_stderr": 0.2718380639604944, "rouge1_fmeasure": 0.4521518805319402, "rouge1_fmeasure_stderr": 0.0022515279038786227, "rouge1_precision": 0.5070856834398472, "rouge1_precision_stderr": 0.003526888789046483, "rouge1_recall": 0.45723976171215824, "rouge1_recall_stderr": 0.0027704797956913073, "rouge2_fmeasure": 0.2242096802521301, "rouge2_fmeasure_stderr": 0.002021997464706373, "rouge2_precision": 0.255120829295647, "rouge2_precision_stderr": 0.0027246646455271546, "rouge2_recall": 0.2268268997863891, "rouge2_recall_stderr": 0.002237190631242654, "rougeL_fmeasure": 0.3385818879988679, "rougeL_fmeasure_stderr": 0.002056019295521777, "rougeL_precision": 0.3810377463717816, "rougeL_precision_stderr": 0.00307213165006003, "rougeL_recall": 0.3423151690624315, "rougeL_recall_stderr": 0.002416743374863738, "rougeLsum_fmeasure": 0.38189174321776803, "rougeLsum_fmeasure_stderr": 0.002258684314720834, "rougeLsum_precision": 0.4285263610786833, "rougeLsum_precision_stderr": 0.003304605518552052, "rougeLsum_recall": 0.38610636284479233, "rougeLsum_recall_stderr": 0.002654435476507776}}, "4": {"generate_text_restaurant": {"bleu": 12.831367617602877, "bleu_stderr": 0.18248133751970383, "rouge1_fmeasure": 0.45672550688868757, "rouge1_fmeasure_stderr": 0.002254562843922049, "rouge1_precision": 0.5008213879398539, "rouge1_precision_stderr": 0.003448214786347665, "rouge1_recall": 0.4677552019051495, "rouge1_recall_stderr": 0.0027487310914847602, "rouge2_fmeasure": 0.22808412145632054, "rouge2_fmeasure_stderr": 0.0020391687587871005, "rouge2_precision": 0.252653067142654, "rouge2_precision_stderr": 0.0026728213400761492, "rouge2_recall": 0.23421861425493357, "rouge2_recall_stderr": 0.0022616561003861407, "rougeL_fmeasure": 0.34183112110248615, "rougeL_fmeasure_stderr": 0.002088453787987109, "rougeL_precision": 0.3751971515131376, "rougeL_precision_stderr": 0.002976831493826089, "rougeL_recall": 0.35072100299356046, "rougeL_recall_stderr": 0.0024722233464228543, "rougeLsum_fmeasure": 0.3886135908143339, "rougeLsum_fmeasure_stderr": 0.0022942589711889686, "rougeLsum_precision": 0.42516588170775854, "rougeLsum_precision_stderr": 0.00322080090809883, "rougeLsum_recall": 0.39902571740048054, "rougeLsum_recall_stderr": 0.002736668954410199}}, "5": {"generate_text_restaurant": {"bleu": 12.476649044527553, "bleu_stderr": 0.1698766854636743, "rouge1_fmeasure": 0.45208098619239717, "rouge1_fmeasure_stderr": 0.002213005671732147, "rouge1_precision": 0.4839633098425305, "rouge1_precision_stderr": 0.003299267823766779, "rouge1_recall": 0.4705499697275458, "rouge1_recall_stderr": 0.002738242144292685, "rouge2_fmeasure": 0.22264024747277225, "rouge2_fmeasure_stderr": 0.001987296116486491, "rouge2_precision": 0.24091846485732277, "rouge2_precision_stderr": 0.0025436868155710828, "rouge2_recall": 0.2320394354997667, "rouge2_recall_stderr": 0.0022071751737241835, "rougeL_fmeasure": 0.3385274428827769, "rougeL_fmeasure_stderr": 0.0020319683310434395, "rougeL_precision": 0.3629543396997906, "rougeL_precision_stderr": 0.0028393546604920366, "rougeL_recall": 0.35264832664365503, "rougeL_recall_stderr": 0.0024261289166555506, "rougeLsum_fmeasure": 0.38655176446890444, "rougeLsum_fmeasure_stderr": 0.0022484585467573517, "rougeLsum_precision": 0.4137754251875113, "rougeLsum_precision_stderr": 0.003126258632288186, "rougeLsum_recall": 0.40238964616699796, "rougeLsum_recall_stderr": 0.002661265077082012}}}, "gem_xsum": {"0": {"article_DOC_summary": {"bleu": 1.9125252340175696, "bleu_stderr": 0.0939254181938478, "rouge1_fmeasure": 0.20307234782166939, "rouge1_fmeasure_stderr": 0.00254398638712588, "rouge1_precision": 0.15896903592047174, "rouge1_precision_stderr": 0.002308498075214904, "rouge1_recall": 0.32151606833527474, "rouge1_recall_stderr": 0.004467750436406024, "rouge2_fmeasure": 0.043691698777011345, "rouge2_fmeasure_stderr": 0.0015720363515098195, "rouge2_precision": 0.03326326936108637, "rouge2_precision_stderr": 0.0013115215791441866, "rouge2_recall": 0.07276812864417066, "rouge2_recall_stderr": 0.00266495974490086, "rougeL_fmeasure": 0.15593841528849953, "rougeL_fmeasure_stderr": 0.0019887757192407814, "rougeL_precision": 0.12182880371774332, "rougeL_precision_stderr": 0.001818918777245228, "rougeL_recall": 0.24834119210557543, "rougeL_recall_stderr": 0.0035628091512773206, "rougeLsum_fmeasure": 0.15748185679405513, "rougeLsum_fmeasure_stderr": 0.002117052212384048, "rougeLsum_precision": 0.1227952289626782, "rougeLsum_precision_stderr": 0.0018764392535370118, "rougeLsum_recall": 0.2516810661517101, "rougeLsum_recall_stderr": 0.0038501177791414915}}, "1": {"article_DOC_summary": {"bleu": 1.4234140719501784, "bleu_stderr": 0.08008244099582335, "rouge1_fmeasure": 0.17438840171489733, "rouge1_fmeasure_stderr": 0.002516782211263018, "rouge1_precision": 0.12456796192309169, "rouge1_precision_stderr": 0.0018663225428676555, "rouge1_recall": 0.3033782811263302, "rouge1_recall_stderr": 0.00435632341852972, "rouge2_fmeasure": 0.03725757946128431, "rouge2_fmeasure_stderr": 0.001453910826534785, "rouge2_precision": 0.026297340000885697, "rouge2_precision_stderr": 0.001027838408615643, "rouge2_recall": 0.06688789749645495, "rouge2_recall_stderr": 0.0027125026315894404, "rougeL_fmeasure": 0.14307994211588798, "rougeL_fmeasure_stderr": 0.002005379862853747, "rougeL_precision": 0.10198505059076171, "rougeL_precision_stderr": 0.0014701582863370355, "rougeL_recall": 0.2506401563563098, "rougeL_recall_stderr": 0.003651091960508788, "rougeLsum_fmeasure": 0.1353866489423388, "rougeLsum_fmeasure_stderr": 0.0020762039106271024, "rougeLsum_precision": 0.09637711275571659, "rougeLsum_precision_stderr": 0.0015128974074199704, "rougeLsum_recall": 0.23772290217746403, "rougeLsum_recall_stderr": 0.0037666734496558294}}, "2": {"article_DOC_summary": {"bleu": 1.403058154138598, "bleu_stderr": 0.07947986565662277, "rouge1_fmeasure": 0.17150651760394497, "rouge1_fmeasure_stderr": 0.0023907265926706956, "rouge1_precision": 0.12257166429044594, "rouge1_precision_stderr": 0.0017758091493012137, "rouge1_recall": 0.2978206183170451, "rouge1_recall_stderr": 0.004153358896452572, "rouge2_fmeasure": 0.03757086142902083, "rouge2_fmeasure_stderr": 0.0014307603878365935, "rouge2_precision": 0.02653075423531747, "rouge2_precision_stderr": 0.0010100537686758024, "rouge2_recall": 0.06731490725572081, "rouge2_recall_stderr": 0.002670773143935172, "rougeL_fmeasure": 0.14604747569954757, "rougeL_fmeasure_stderr": 0.0020129836183947333, "rougeL_precision": 0.10424146003543594, "rougeL_precision_stderr": 0.001484600288621153, "rougeL_recall": 0.25471602692648093, "rougeL_recall_stderr": 0.003610349405448802, "rougeLsum_fmeasure": 0.13155136268487863, "rougeLsum_fmeasure_stderr": 0.0019833919805789246, "rougeLsum_precision": 0.09373790710180954, "rougeLsum_precision_stderr": 0.0014469445596197233, "rougeLsum_recall": 0.23028725682485185, "rougeLsum_recall_stderr": 0.0035926993484314182}}, "3": {"article_DOC_summary": {"bleu": 1.4860485963618193, "bleu_stderr": 0.09363961497980915, "rouge1_fmeasure": 0.1664704853916206, "rouge1_fmeasure_stderr": 0.00250451940953418, "rouge1_precision": 0.12212159195548629, "rouge1_precision_stderr": 0.0020413508418911223, "rouge1_recall": 0.28379290430795073, "rouge1_recall_stderr": 0.004300429318890937, "rouge2_fmeasure": 0.037348548046976356, "rouge2_fmeasure_stderr": 0.0014490141107738803, "rouge2_precision": 0.027086922588921557, "rouge2_precision_stderr": 0.0010893085545950853, "rouge2_recall": 0.06560470949712288, "rouge2_recall_stderr": 0.0025928364606295586, "rougeL_fmeasure": 0.14204750890662055, "rougeL_fmeasure_stderr": 0.0021403616377412287, "rougeL_precision": 0.10394812833382235, "rougeL_precision_stderr": 0.0017256599090190122, "rougeL_recall": 0.24318873056030976, "rougeL_recall_stderr": 0.0037594406422229213, "rougeLsum_fmeasure": 0.12846242652343276, "rougeLsum_fmeasure_stderr": 0.0020450420326324982, "rougeLsum_precision": 0.09419477661930503, "rougeLsum_precision_stderr": 0.0016768519118452933, "rougeLsum_recall": 0.22033465049587264, "rougeLsum_recall_stderr": 0.003618847956030538}}, "4": {"article_DOC_summary": {"bleu": 0.8326562560108917, "bleu_stderr": 0.1467525734431667, "rouge1_fmeasure": 0.047356647789818455, "rouge1_fmeasure_stderr": 0.002748168768611129, "rouge1_precision": 0.041843850057486254, "rouge1_precision_stderr": 0.0027248704585387203, "rouge1_recall": 0.07170804112417602, "rouge1_recall_stderr": 0.0041857327071730364, "rouge2_fmeasure": 0.010923150617633553, "rouge2_fmeasure_stderr": 0.001018598314862772, "rouge2_precision": 0.00975684909437077, "rouge2_precision_stderr": 0.0010812973230085907, "rouge2_recall": 0.016640859698859974, "rouge2_recall_stderr": 0.0015451158301785048, "rougeL_fmeasure": 0.03990722372366724, "rougeL_fmeasure_stderr": 0.002276301239159138, "rougeL_precision": 0.03544031461665562, "rougeL_precision_stderr": 0.002305692160527795, "rougeL_recall": 0.06079313428910594, "rougeL_recall_stderr": 0.0035266276653790293, "rougeLsum_fmeasure": 0.036847659155334334, "rougeLsum_fmeasure_stderr": 0.0021765624675524546, "rougeLsum_precision": 0.03328647749360134, "rougeLsum_precision_stderr": 0.0022740307934491265, "rougeLsum_recall": 0.0556921853671952, "rougeLsum_recall_stderr": 0.003318230068428034}}, "5": {"article_DOC_summary": {"bleu": 5.230211901475508e-35, "bleu_stderr": 5.134007383899523e-30, "rouge1_fmeasure": 0.0028438767697741185, "rouge1_fmeasure_stderr": 0.0008091353860408605, "rouge1_precision": 0.003243188732265197, "rouge1_precision_stderr": 0.0009910456520478602, "rouge1_recall": 0.0026536470502779067, "rouge1_recall_stderr": 0.0007340423451228517, "rouge2_fmeasure": 0.0006098723079855157, "rouge2_fmeasure_stderr": 0.0003241318837354033, "rouge2_precision": 0.0007579961658762991, "rouge2_precision_stderr": 0.0004164644743745851, "rouge2_recall": 0.0005294862370334068, "rouge2_recall_stderr": 0.00028364001336350907, "rougeL_fmeasure": 0.0022743929327468044, "rougeL_fmeasure_stderr": 0.0006386166431455819, "rougeL_precision": 0.002549580362974837, "rougeL_precision_stderr": 0.0007512133719590526, "rougeL_recall": 0.0021600686497647045, "rougeL_recall_stderr": 0.0006036544336792427, "rougeLsum_fmeasure": 0.0025220053356973726, "rougeLsum_fmeasure_stderr": 0.0007351598994991656, "rougeLsum_precision": 0.0028617335261268903, "rougeLsum_precision_stderr": 0.0008958933741864754, "rougeLsum_recall": 0.0023705346379101037, "rougeLsum_recall_stderr": 0.0006744765626606669}}}} \ No newline at end of file diff --git a/4b284b84bc4seed4/evaluation/generation/slim.4b284b84bc4seed4_GEM-web_nlg_en_PALM_prompt_0.json b/4b284b84bc4seed4/evaluation/generation/slim.4b284b84bc4seed4_GEM-web_nlg_en_PALM_prompt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..b96802a824a85290f749f76a396a4f5f83ec3ba9 --- /dev/null +++ b/4b284b84bc4seed4/evaluation/generation/slim.4b284b84bc4seed4_GEM-web_nlg_en_PALM_prompt_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.3523277002277804, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.03261401734869028 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07140357303785742, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0017735064753741127 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.2938068811232804, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.004698591443703581 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.10590846249521367, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0020195315762052673 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.033440949253294806, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.001066168691596413 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.14239106266330545, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003163086494032039 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.050108480283474685, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0012479824947943812 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.06888442229810386, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.001675844279268184 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.2866580974880424, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004577594263202556 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.10246592063839631, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0018904079137483055 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.06827936311686421, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.001698555616698455 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.28107278592336027, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004438130822299941 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.10120297741035127, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0018969772318448463 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed4/evaluation/generation/slim.4b284b84bc4seed4_GEM-web_nlg_en_PALM_prompt_1.json b/4b284b84bc4seed4/evaluation/generation/slim.4b284b84bc4seed4_GEM-web_nlg_en_PALM_prompt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..a5a2e146cf33e4c217c331322aab7b89f9248440 --- /dev/null +++ b/4b284b84bc4seed4/evaluation/generation/slim.4b284b84bc4seed4_GEM-web_nlg_en_PALM_prompt_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.4351779771917347, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.03461044967042056 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07162194662437592, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0013087409774892172 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.3606308247426329, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005204874863706004 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.11195633719029822, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0017956976300324953 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03355406237669093, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0008232466042918183 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.17649806895632947, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003573445474921975 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.05255280813689339, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0011567693373819863 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.06810242914702684, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0012110333378022905 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.34048847512021524, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004750749477340653 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.10647953810824176, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0016760663905838954 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.06848895184352013, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0012480162482644015 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.3429613098536967, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004820988766109633 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.10693711806502432, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0017046988764721166 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed4/evaluation/generation/slim.4b284b84bc4seed4_GEM-web_nlg_en_PALM_prompt_2.json b/4b284b84bc4seed4/evaluation/generation/slim.4b284b84bc4seed4_GEM-web_nlg_en_PALM_prompt_2.json new file mode 100644 index 0000000000000000000000000000000000000000..bee22df9cc3b53fb2d789f5e549bee07ad8ee4a5 --- /dev/null +++ b/4b284b84bc4seed4/evaluation/generation/slim.4b284b84bc4seed4_GEM-web_nlg_en_PALM_prompt_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.4447149214180348, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.018972548555560714 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07269992209256788, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0012516992696440586 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.3753121304840736, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0050439493858917194 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.11462405866857102, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.001736014539262953 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03404844764438817, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007680445086395626 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.1879602254006144, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003710463717182471 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.05396475791939589, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.001107305452781615 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.06834435101252613, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0011410779513936623 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.350761541750936, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0045336528849166365 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.10775063055928252, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0015887580065971389 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.06935895852997251, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0011852302620070257 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.3565184552784119, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004687409183137695 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.10926127364577738, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0016390081021653892 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed4/evaluation/generation/slim.4b284b84bc4seed4_GEM-web_nlg_en_PALM_prompt_3.json b/4b284b84bc4seed4/evaluation/generation/slim.4b284b84bc4seed4_GEM-web_nlg_en_PALM_prompt_3.json new file mode 100644 index 0000000000000000000000000000000000000000..8366b9e7cd9afc61f1409ecc5d5053ac79be0f40 --- /dev/null +++ b/4b284b84bc4seed4/evaluation/generation/slim.4b284b84bc4seed4_GEM-web_nlg_en_PALM_prompt_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.5087674664658492, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.026893638286752154 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.072497531691811, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0012026919993320111 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.38474435436270493, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005142183312772921 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.11467972816113098, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.001673200203783686 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03380876275906201, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007518942865145289 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.19155642039509754, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0037517387263905507 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.05374249345557979, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0010894570854945713 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.06774922502819766, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0011043288246760676 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.355788174091109, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004543365107062434 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.10704454572486424, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0015340338132748832 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.06899862406820627, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0011409968694109725 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.36454854774413287, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004741615558398587 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.10908169881982438, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0015837111282973452 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed4/evaluation/generation/slim.4b284b84bc4seed4_GEM-web_nlg_en_PALM_prompt_4.json b/4b284b84bc4seed4/evaluation/generation/slim.4b284b84bc4seed4_GEM-web_nlg_en_PALM_prompt_4.json new file mode 100644 index 0000000000000000000000000000000000000000..166dd8b44c834676e99e29de17746ffb271bdfef --- /dev/null +++ b/4b284b84bc4seed4/evaluation/generation/slim.4b284b84bc4seed4_GEM-web_nlg_en_PALM_prompt_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.5913746773860721, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.041085758656651254 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07471728852529957, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.00120444126407064 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.4024992804481891, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005245342121017829 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.11862510680315241, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0016779930474832658 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.0348700360833608, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007408153164874413 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.2036124062513765, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.00387597600568855 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.05567978816710457, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0010718834740964826 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.06888490676353087, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0010959048971556757 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.3672784960986926, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004566861844635672 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.10913463867270404, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0015113181951666658 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.07096869733176525, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0011452901218571788 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.3804621853389486, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.00482918129805665 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.11255292648692071, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0015868430386374208 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed4/evaluation/generation/slim.4b284b84bc4seed4_GEM-web_nlg_en_PALM_prompt_5.json b/4b284b84bc4seed4/evaluation/generation/slim.4b284b84bc4seed4_GEM-web_nlg_en_PALM_prompt_5.json new file mode 100644 index 0000000000000000000000000000000000000000..af5632bfcab6c8ba77b2a413271adc6dfad3c427 --- /dev/null +++ b/4b284b84bc4seed4/evaluation/generation/slim.4b284b84bc4seed4_GEM-web_nlg_en_PALM_prompt_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.6304604966593631, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.03484982021747957 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.0744328271529154, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.001157549734274375 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.4127612356762462, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0052523273943021025 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.11884850755997649, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.001616705319256009 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03482016206562085, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007258016003322981 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.20894584695108945, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0038600278798887723 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.05592752125205284, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0010528579472296477 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.0684803394428656, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0010698339353882353 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.3750129978505135, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004543607982881679 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.1090677963632186, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0014765997700889857 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.07077155348314326, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0011076088583072189 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.3900673103247878, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0048425468419916184 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.11288876880831, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0015402308170382386 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed4/evaluation/generation/slim.4b284b84bc4seed4_GEM-wiki_lingua_en_tldr_en_0.json b/4b284b84bc4seed4/evaluation/generation/slim.4b284b84bc4seed4_GEM-wiki_lingua_en_tldr_en_0.json new file mode 100644 index 0000000000000000000000000000000000000000..913858d20b77cca51c4767c4e2794e5a0da4c39f --- /dev/null +++ b/4b284b84bc4seed4/evaluation/generation/slim.4b284b84bc4seed4_GEM-wiki_lingua_en_tldr_en_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.15130222816102726, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0018641353605878376 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.2585048040019072, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0026633037296359954 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.17708913864416292, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0018212193534322709 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.030354095195740356, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007454497776331851 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.05433811946884532, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0014397669916064314 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.0358183863771304, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.00084133860800268 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.11775252929311998, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0013049047450472628 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.20864111880992672, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.002169509233782621 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.1395967400507796, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.001313393024815337 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.13805300047109062, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0017010449743815584 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.23676218222386985, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.002462862595699301 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.16174636673799278, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0016649134344973989 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 1.5421125542141876, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.05756547176107712 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed4/evaluation/generation/slim.4b284b84bc4seed4_GEM-wiki_lingua_en_tldr_en_1.json b/4b284b84bc4seed4/evaluation/generation/slim.4b284b84bc4seed4_GEM-wiki_lingua_en_tldr_en_1.json new file mode 100644 index 0000000000000000000000000000000000000000..1cb92730a8631c117345d5c67f655be6980c714a --- /dev/null +++ b/4b284b84bc4seed4/evaluation/generation/slim.4b284b84bc4seed4_GEM-wiki_lingua_en_tldr_en_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.2194647051475106, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0026637127905829957 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.32953538987527364, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0029752735913270213 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.23390150161377168, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0020117545140889465 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.060079962682567656, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0015430426704356244 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.08864081298208347, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0018541652458318118 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.061675743964392724, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0011660228294911223 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.1539694016100103, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0020721550784059055 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.23350379059815546, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.002302352375151091 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.1623726890739185, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0013550604960878186 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.20602533584010463, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.00254117072503622 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.30941435638814363, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0028218530563501962 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.21928618412182982, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0018889547156816118 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 3.1118566247604162, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.062088508469292286 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed4/evaluation/generation/slim.4b284b84bc4seed4_GEM-wiki_lingua_en_tldr_en_2.json b/4b284b84bc4seed4/evaluation/generation/slim.4b284b84bc4seed4_GEM-wiki_lingua_en_tldr_en_2.json new file mode 100644 index 0000000000000000000000000000000000000000..80e0917b94991b3672cf8254bc79ea3d46cc48da --- /dev/null +++ b/4b284b84bc4seed4/evaluation/generation/slim.4b284b84bc4seed4_GEM-wiki_lingua_en_tldr_en_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.21230058363878315, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0024080619207750963 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.34134579643295393, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.00287291808958866 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.23819401638529333, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.001961472755718473 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.058180340769663996, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0012366998672630046 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.09448704160727436, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0018410055564769775 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.06423744493296574, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0011237343652403928 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.14716839436847945, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.001723324637255188 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.24371061167078392, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.002305940409051167 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.16572553377575022, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0013269375688079502 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.19985650365773666, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0022791002962553927 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.32205265894357177, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0027492000000614377 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.22428067952847994, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.001853122562183745 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 3.3250803512114917, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.043720151005010505 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed4/evaluation/generation/slim.4b284b84bc4seed4_GEM-wiki_lingua_en_tldr_en_3.json b/4b284b84bc4seed4/evaluation/generation/slim.4b284b84bc4seed4_GEM-wiki_lingua_en_tldr_en_3.json new file mode 100644 index 0000000000000000000000000000000000000000..5f7dc9285fac0aa30f7b4fbafbcf6118c0f20535 --- /dev/null +++ b/4b284b84bc4seed4/evaluation/generation/slim.4b284b84bc4seed4_GEM-wiki_lingua_en_tldr_en_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.1759676944241637, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.002599503777933057 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.2783528249629676, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.003439775464191638 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.19371662716809854, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.002332163732000944 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.04672040323211839, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0011635414202250617 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.07600165390612795, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0018062659171568973 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.05098365238098847, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0010739239370527816 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.12481870305727255, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0018681974052869646 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.2032107116074926, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0026995788494260085 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.13757683764937148, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0016125055112952101 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.165693431417505, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0024409611879563638 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.26318808414968303, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0032807386039732994 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.18265210486261796, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.002199082319355358 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 3.264795684563816, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.0665539830427249 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed4/evaluation/generation/slim.4b284b84bc4seed4_GEM-wiki_lingua_en_tldr_en_4.json b/4b284b84bc4seed4/evaluation/generation/slim.4b284b84bc4seed4_GEM-wiki_lingua_en_tldr_en_4.json new file mode 100644 index 0000000000000000000000000000000000000000..b324d638cddcfe74b4ec0f940304df845521f1a0 --- /dev/null +++ b/4b284b84bc4seed4/evaluation/generation/slim.4b284b84bc4seed4_GEM-wiki_lingua_en_tldr_en_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.05753559661305722, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.002138715660683914 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.0930047418871661, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0031434712495670048 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.061810069279221835, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.002050884974045622 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.014474681217716064, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0008323203723133832 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.025504176001051017, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.001303289046442984 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.01571321711438463, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.000725772297710108 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.042660119298722994, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0016477900120572672 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.06969950422653938, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0024116366945608377 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.04536102247912932, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.001487864376367666 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.05421281196909096, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.002025499714973123 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.08758632873317065, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0029650946931968555 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.058117132916654005, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0019249371066501861 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 0.7399731218010301, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.05315913015718361 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed4/evaluation/generation/slim.4b284b84bc4seed4_GEM-wiki_lingua_en_tldr_en_5.json b/4b284b84bc4seed4/evaluation/generation/slim.4b284b84bc4seed4_GEM-wiki_lingua_en_tldr_en_5.json new file mode 100644 index 0000000000000000000000000000000000000000..fb67ed72d93cf229bfe24fc13427ce9187d8b63f --- /dev/null +++ b/4b284b84bc4seed4/evaluation/generation/slim.4b284b84bc4seed4_GEM-wiki_lingua_en_tldr_en_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.009165990245767591, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0009442979407312777 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.015418596799201417, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0015077442548408681 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.009774296059399336, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0009080621408899851 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.0023451269499108907, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.00034470873041317335 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.0046018834347627035, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0006803082985888496 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.002509211412713389, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0003022299477574736 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.00678359535997039, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0007097335601922828 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.011572236419649438, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0011572136947999466 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.00720761001914484, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0006681163091531024 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.008486993163393306, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0008690259306885085 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.014459769727609291, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0014158078041286931 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.00912075895864339, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0008473674103987658 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 1.7124193494262821e-06, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 3.2741945230754847e-06 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed4/evaluation/generation/slim.4b284b84bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_0.json b/4b284b84bc4seed4/evaluation/generation/slim.4b284b84bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..8470f104247ed541607e2743b917d5fa27f3571d --- /dev/null +++ b/4b284b84bc4seed4/evaluation/generation/slim.4b284b84bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 0.05808891716691411, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.011333330592580656 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.3023091414929599, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.002913887406749905 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.12238985523242189, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0013610627775538216 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.13899147577262666, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0009286294871679315 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.022775128205128368, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0011384359586054489 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.00610855031631702, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0002896485948013325 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.007854709999230764, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.00036516539565493495 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.2745392561803429, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.002727571611712019 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.11483479288312695, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0013803318617414532 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.1275827225198627, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0008841123038167355 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.27555523169576246, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.002926670520914391 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.1020509279394632, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0009751330314082834 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.12203235569838602, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0009202893055765295 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed4/evaluation/generation/slim.4b284b84bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_1.json b/4b284b84bc4seed4/evaluation/generation/slim.4b284b84bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_1.json new file mode 100644 index 0000000000000000000000000000000000000000..55a4dd9c2f309698bf982c3b59c1592fec5d35f3 --- /dev/null +++ b/4b284b84bc4seed4/evaluation/generation/slim.4b284b84bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 8.932841105621064, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.11441707444147597 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.44530595662757727, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0036595275413873183 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.42827303768403047, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0030343030656821836 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.3974228957995462, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.002320429553502724 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.20230936163095836, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0025036401909577727 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.19120188941717492, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.00210380636425424 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.17753845874321364, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0018327497034708936 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.33275929259548276, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.00295993230865274 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.32342830006561096, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.002557175371249573 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.2971909218049089, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0018836069812237484 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.36536808388203507, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0033140674546694128 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.35017983210590575, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0027753545840717682 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.3253556432256207, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0022142373615418754 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed4/evaluation/generation/slim.4b284b84bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_2.json b/4b284b84bc4seed4/evaluation/generation/slim.4b284b84bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_2.json new file mode 100644 index 0000000000000000000000000000000000000000..1219933717c56cfbb1a956176062c21e0084a412 --- /dev/null +++ b/4b284b84bc4seed4/evaluation/generation/slim.4b284b84bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 11.880063105811095, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.17984450139554475 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.506737464401302, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0035936965647612898 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.45038732838216006, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0028591739786909026 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.44505676798399185, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0022811968446148742 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.24833021143506717, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.002726123256626373 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.2167301855181476, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.002197696079985957 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.21441790403427352, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0019873610836182685 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.37992704007005046, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0030781300319706554 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.337552347296149, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0024789904236623512 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.33281096535989263, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.002027510114174692 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.4242330670183315, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0033488862052480383 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3763581811094256, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002695938632190225 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.3722406759710508, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.002269175188375031 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed4/evaluation/generation/slim.4b284b84bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_3.json b/4b284b84bc4seed4/evaluation/generation/slim.4b284b84bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_3.json new file mode 100644 index 0000000000000000000000000000000000000000..58936c342f3f7620ece4de125adc913faac72b98 --- /dev/null +++ b/4b284b84bc4seed4/evaluation/generation/slim.4b284b84bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 12.520921591661882, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.2718380639604944 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.5070856834398472, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.003526888789046483 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.45723976171215824, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0027704797956913073 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.4521518805319402, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0022515279038786227 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.255120829295647, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0027246646455271546 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.2268268997863891, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.002237190631242654 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.2242096802521301, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.002021997464706373 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.3810377463717816, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.00307213165006003 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3423151690624315, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.002416743374863738 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.3385818879988679, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.002056019295521777 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.4285263610786833, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.003304605518552052 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.38610636284479233, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002654435476507776 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.38189174321776803, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.002258684314720834 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed4/evaluation/generation/slim.4b284b84bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_4.json b/4b284b84bc4seed4/evaluation/generation/slim.4b284b84bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_4.json new file mode 100644 index 0000000000000000000000000000000000000000..ae02cfda80b207baeeefecd35840d921385edc88 --- /dev/null +++ b/4b284b84bc4seed4/evaluation/generation/slim.4b284b84bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 12.831367617602877, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.18248133751970383 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.5008213879398539, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.003448214786347665 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4677552019051495, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0027487310914847602 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.45672550688868757, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.002254562843922049 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.252653067142654, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0026728213400761492 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.23421861425493357, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0022616561003861407 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.22808412145632054, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0020391687587871005 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.3751971515131376, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.002976831493826089 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.35072100299356046, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0024722233464228543 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.34183112110248615, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.002088453787987109 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.42516588170775854, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.00322080090809883 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.39902571740048054, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002736668954410199 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.3886135908143339, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0022942589711889686 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed4/evaluation/generation/slim.4b284b84bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_5.json b/4b284b84bc4seed4/evaluation/generation/slim.4b284b84bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_5.json new file mode 100644 index 0000000000000000000000000000000000000000..f61e7259c498a6b604e08cbd53834e10f7b750f9 --- /dev/null +++ b/4b284b84bc4seed4/evaluation/generation/slim.4b284b84bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 12.476649044527553, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.1698766854636743 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.4839633098425305, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.003299267823766779 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4705499697275458, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.002738242144292685 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.45208098619239717, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.002213005671732147 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.24091846485732277, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0025436868155710828 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.2320394354997667, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0022071751737241835 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.22264024747277225, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.001987296116486491 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.3629543396997906, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0028393546604920366 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.35264832664365503, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0024261289166555506 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.3385274428827769, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0020319683310434395 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.4137754251875113, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.003126258632288186 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.40238964616699796, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002661265077082012 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.38655176446890444, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0022484585467573517 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed4/evaluation/generation/slim.4b284b84bc4seed4_gem_xsum_article_DOC_summary_0.json b/4b284b84bc4seed4/evaluation/generation/slim.4b284b84bc4seed4_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..160a218bb7b3723d198df847faedb824850f9e90 --- /dev/null +++ b/4b284b84bc4seed4/evaluation/generation/slim.4b284b84bc4seed4_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.15896903592047174, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.002308498075214904 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.32151606833527474, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004467750436406024 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.20307234782166939, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.00254398638712588 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.03326326936108637, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0013115215791441866 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.07276812864417066, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.00266495974490086 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.043691698777011345, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0015720363515098195 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.12182880371774332, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.001818918777245228 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.24834119210557543, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0035628091512773206 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.15593841528849953, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0019887757192407814 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.1227952289626782, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0018764392535370118 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.2516810661517101, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0038501177791414915 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.15748185679405513, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.002117052212384048 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.9125252340175696, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.0939254181938478 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed4/evaluation/generation/slim.4b284b84bc4seed4_gem_xsum_article_DOC_summary_1.json b/4b284b84bc4seed4/evaluation/generation/slim.4b284b84bc4seed4_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..c81794c56480474a88ebd1289d14cb9d06b43caf --- /dev/null +++ b/4b284b84bc4seed4/evaluation/generation/slim.4b284b84bc4seed4_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.12456796192309169, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0018663225428676555 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.3033782811263302, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.00435632341852972 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.17438840171489733, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.002516782211263018 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.026297340000885697, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.001027838408615643 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.06688789749645495, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0027125026315894404 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.03725757946128431, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.001453910826534785 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.10198505059076171, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0014701582863370355 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.2506401563563098, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.003651091960508788 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.14307994211588798, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.002005379862853747 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.09637711275571659, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0015128974074199704 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.23772290217746403, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0037666734496558294 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.1353866489423388, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0020762039106271024 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.4234140719501784, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.08008244099582335 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed4/evaluation/generation/slim.4b284b84bc4seed4_gem_xsum_article_DOC_summary_2.json b/4b284b84bc4seed4/evaluation/generation/slim.4b284b84bc4seed4_gem_xsum_article_DOC_summary_2.json new file mode 100644 index 0000000000000000000000000000000000000000..821ed63b119c9db7294b7da8a84eb15deca33939 --- /dev/null +++ b/4b284b84bc4seed4/evaluation/generation/slim.4b284b84bc4seed4_gem_xsum_article_DOC_summary_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.12257166429044594, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0017758091493012137 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.2978206183170451, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004153358896452572 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.17150651760394497, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0023907265926706956 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.02653075423531747, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0010100537686758024 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.06731490725572081, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.002670773143935172 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.03757086142902083, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0014307603878365935 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.10424146003543594, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.001484600288621153 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.25471602692648093, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.003610349405448802 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.14604747569954757, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0020129836183947333 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.09373790710180954, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0014469445596197233 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.23028725682485185, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0035926993484314182 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.13155136268487863, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0019833919805789246 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.403058154138598, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.07947986565662277 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed4/evaluation/generation/slim.4b284b84bc4seed4_gem_xsum_article_DOC_summary_3.json b/4b284b84bc4seed4/evaluation/generation/slim.4b284b84bc4seed4_gem_xsum_article_DOC_summary_3.json new file mode 100644 index 0000000000000000000000000000000000000000..2ccb77788e56eaf3d61e812aeace5fc745bdb138 --- /dev/null +++ b/4b284b84bc4seed4/evaluation/generation/slim.4b284b84bc4seed4_gem_xsum_article_DOC_summary_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.12212159195548629, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0020413508418911223 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.28379290430795073, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004300429318890937 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.1664704853916206, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.00250451940953418 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.027086922588921557, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0010893085545950853 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.06560470949712288, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0025928364606295586 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.037348548046976356, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0014490141107738803 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.10394812833382235, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0017256599090190122 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.24318873056030976, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0037594406422229213 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.14204750890662055, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0021403616377412287 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.09419477661930503, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0016768519118452933 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.22033465049587264, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.003618847956030538 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.12846242652343276, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0020450420326324982 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.4860485963618193, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.09363961497980915 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed4/evaluation/generation/slim.4b284b84bc4seed4_gem_xsum_article_DOC_summary_4.json b/4b284b84bc4seed4/evaluation/generation/slim.4b284b84bc4seed4_gem_xsum_article_DOC_summary_4.json new file mode 100644 index 0000000000000000000000000000000000000000..543fbc679fc7e2071f00c67b00622b5985e96bd9 --- /dev/null +++ b/4b284b84bc4seed4/evaluation/generation/slim.4b284b84bc4seed4_gem_xsum_article_DOC_summary_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.041843850057486254, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0027248704585387203 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.07170804112417602, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.0041857327071730364 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.047356647789818455, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.002748168768611129 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.00975684909437077, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0010812973230085907 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.016640859698859974, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0015451158301785048 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.010923150617633553, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.001018598314862772 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.03544031461665562, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.002305692160527795 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.06079313428910594, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0035266276653790293 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.03990722372366724, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.002276301239159138 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.03328647749360134, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0022740307934491265 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.0556921853671952, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.003318230068428034 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.036847659155334334, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0021765624675524546 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 0.8326562560108917, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.1467525734431667 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed4/evaluation/generation/slim.4b284b84bc4seed4_gem_xsum_article_DOC_summary_5.json b/4b284b84bc4seed4/evaluation/generation/slim.4b284b84bc4seed4_gem_xsum_article_DOC_summary_5.json new file mode 100644 index 0000000000000000000000000000000000000000..e08f3711ed1413ccdd303c69a1ce93aaee614d5b --- /dev/null +++ b/4b284b84bc4seed4/evaluation/generation/slim.4b284b84bc4seed4_gem_xsum_article_DOC_summary_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.003243188732265197, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0009910456520478602 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.0026536470502779067, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.0007340423451228517 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.0028438767697741185, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0008091353860408605 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.0007579961658762991, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0004164644743745851 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.0005294862370334068, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.00028364001336350907 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.0006098723079855157, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0003241318837354033 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.002549580362974837, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0007512133719590526 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.0021600686497647045, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0006036544336792427 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.0022743929327468044, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0006386166431455819 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.0028617335261268903, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0008958933741864754 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.0023705346379101037, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0006744765626606669 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.0025220053356973726, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0007351598994991656 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 5.230211901475508e-35, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 5.134007383899523e-30 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b84bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed4/evaluation/rankeval/4b284b84bc4seed4_0.csv b/4b284b84bc4seed4/evaluation/rankeval/4b284b84bc4seed4_0.csv new file mode 100644 index 0000000000000000000000000000000000000000..98683b3a154a37e0e48b0e97690b0cd724f896c6 --- /dev/null +++ b/4b284b84bc4seed4/evaluation/rankeval/4b284b84bc4seed4_0.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.335,0.014933117490932575,0 +anli_r2,acc,0.333,0.01491084616422986,0 +anli_r3,acc,0.33416666666666667,0.013622434813136781,0 +arc_challenge,acc,0.2619453924914676,0.012849054826858115,0 +arc_challenge,acc_norm,0.29180887372013653,0.013284525292403508,0 +arc_easy,acc,0.5888047138047138,0.010096663811817681,0 +arc_easy,acc_norm,0.5197811447811448,0.010251751199542738,0 +boolq,acc,0.5984709480122324,0.008573784490094752,1 +cb,acc,0.42857142857142855,0.06672848092813058,1 +cb,f1,0.21956970232832299,,1 +copa,acc,0.68,0.046882617226215034,0 +hellaswag,acc,0.4700258912567218,0.00498080723113675,0 +hellaswag,acc_norm,0.6167098187612029,0.00485194417067125,0 +piqa,acc,0.7519042437431991,0.010077118315574719,0 +piqa,acc_norm,0.7568008705114254,0.01000961195385892,0 +rte,acc,0.5270758122743683,0.030052303463143706,0 +sciq,acc,0.845,0.01145015747079947,0 +sciq,acc_norm,0.766,0.01339490288966001,0 +storycloze_2016,acc,0.7167290219134153,0.010419760409155363,0 +winogrande,acc,0.595895816890292,0.013791610664670858,0 diff --git a/4b284b84bc4seed4/evaluation/rankeval/4b284b84bc4seed4_0.json b/4b284b84bc4seed4/evaluation/rankeval/4b284b84bc4seed4_0.json new file mode 100644 index 0000000000000000000000000000000000000000..85229f19d22a231d76dfe395801fffabd19f76f0 --- /dev/null +++ b/4b284b84bc4seed4/evaluation/rankeval/4b284b84bc4seed4_0.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.335, + "acc_stderr": 0.014933117490932575 + }, + "anli_r2": { + "acc": 0.333, + "acc_stderr": 0.01491084616422986 + }, + "anli_r3": { + "acc": 0.33416666666666667, + "acc_stderr": 0.013622434813136781 + }, + "cb": { + "acc": 0.42857142857142855, + "acc_stderr": 0.06672848092813058, + "f1": 0.21956970232832299 + }, + "copa": { + "acc": 0.68, + "acc_stderr": 0.046882617226215034 + }, + "hellaswag": { + "acc": 0.4700258912567218, + "acc_stderr": 0.00498080723113675, + "acc_norm": 0.6167098187612029, + "acc_norm_stderr": 0.00485194417067125 + }, + "rte": { + "acc": 0.5270758122743683, + "acc_stderr": 0.030052303463143706 + }, + "winogrande": { + "acc": 0.595895816890292, + "acc_stderr": 0.013791610664670858 + }, + "storycloze_2016": { + "acc": 0.7167290219134153, + "acc_stderr": 0.010419760409155363 + }, + "boolq": { + "acc": 0.5984709480122324, + "acc_stderr": 0.008573784490094752 + }, + "arc_easy": { + "acc": 0.5888047138047138, + "acc_stderr": 0.010096663811817681, + "acc_norm": 0.5197811447811448, + "acc_norm_stderr": 0.010251751199542738 + }, + "arc_challenge": { + "acc": 0.2619453924914676, + "acc_stderr": 0.012849054826858115, + "acc_norm": 0.29180887372013653, + "acc_norm_stderr": 0.013284525292403508 + }, + "sciq": { + "acc": 0.845, + "acc_stderr": 0.01145015747079947, + "acc_norm": 0.766, + "acc_norm_stderr": 0.01339490288966001 + }, + "piqa": { + "acc": 0.7519042437431991, + "acc_stderr": 0.010077118315574719, + "acc_norm": 0.7568008705114254, + "acc_norm_stderr": 0.01000961195385892 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed4/evaluation/rankeval/4b284b84bc4seed4_1.csv b/4b284b84bc4seed4/evaluation/rankeval/4b284b84bc4seed4_1.csv new file mode 100644 index 0000000000000000000000000000000000000000..d8915e8b4508d47a4b54a480fa9c8bb7ff46e90a --- /dev/null +++ b/4b284b84bc4seed4/evaluation/rankeval/4b284b84bc4seed4_1.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.326,0.014830507204541037,0 +anli_r2,acc,0.334,0.014922019523732961,0 +anli_r3,acc,0.3258333333333333,0.013535422043417455,0 +arc_challenge,acc,0.28242320819112626,0.013155456884097224,0 +arc_challenge,acc_norm,0.3097269624573379,0.013512058415238361,0 +arc_easy,acc,0.6212121212121212,0.009953737656542037,0 +arc_easy,acc_norm,0.5829124579124579,0.010117738967781986,0 +boolq,acc,0.6045871559633027,0.008551600109082904,1 +cb,acc,0.48214285714285715,0.0673769750864465,1 +cb,f1,0.33001107419712067,,1 +copa,acc,0.75,0.04351941398892446,0 +hellaswag,acc,0.4678350926110337,0.004979446038824758,0 +hellaswag,acc_norm,0.6130252937661821,0.0048606237334611405,0 +piqa,acc,0.7453754080522307,0.010164432237060492,0 +piqa,acc_norm,0.7595212187159956,0.009971345364651064,0 +rte,acc,0.5451263537906137,0.029973636495415255,0 +sciq,acc,0.888,0.009977753031397234,0 +sciq,acc_norm,0.862,0.010912152632504401,0 +storycloze_2016,acc,0.7097808658471406,0.010495529690730063,0 +winogrande,acc,0.585635359116022,0.013844846232268563,0 diff --git a/4b284b84bc4seed4/evaluation/rankeval/4b284b84bc4seed4_1.json b/4b284b84bc4seed4/evaluation/rankeval/4b284b84bc4seed4_1.json new file mode 100644 index 0000000000000000000000000000000000000000..b0d6b295e098da4656aba434ee46ec480641bcbc --- /dev/null +++ b/4b284b84bc4seed4/evaluation/rankeval/4b284b84bc4seed4_1.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.326, + "acc_stderr": 0.014830507204541037 + }, + "anli_r2": { + "acc": 0.334, + "acc_stderr": 0.014922019523732961 + }, + "anli_r3": { + "acc": 0.3258333333333333, + "acc_stderr": 0.013535422043417455 + }, + "cb": { + "acc": 0.48214285714285715, + "acc_stderr": 0.0673769750864465, + "f1": 0.33001107419712067 + }, + "copa": { + "acc": 0.75, + "acc_stderr": 0.04351941398892446 + }, + "hellaswag": { + "acc": 0.4678350926110337, + "acc_stderr": 0.004979446038824758, + "acc_norm": 0.6130252937661821, + "acc_norm_stderr": 0.0048606237334611405 + }, + "rte": { + "acc": 0.5451263537906137, + "acc_stderr": 0.029973636495415255 + }, + "winogrande": { + "acc": 0.585635359116022, + "acc_stderr": 0.013844846232268563 + }, + "storycloze_2016": { + "acc": 0.7097808658471406, + "acc_stderr": 0.010495529690730063 + }, + "boolq": { + "acc": 0.6045871559633027, + "acc_stderr": 0.008551600109082904 + }, + "arc_easy": { + "acc": 0.6212121212121212, + "acc_stderr": 0.009953737656542037, + "acc_norm": 0.5829124579124579, + "acc_norm_stderr": 0.010117738967781986 + }, + "arc_challenge": { + "acc": 0.28242320819112626, + "acc_stderr": 0.013155456884097224, + "acc_norm": 0.3097269624573379, + "acc_norm_stderr": 0.013512058415238361 + }, + "sciq": { + "acc": 0.888, + "acc_stderr": 0.009977753031397234, + "acc_norm": 0.862, + "acc_norm_stderr": 0.010912152632504401 + }, + "piqa": { + "acc": 0.7453754080522307, + "acc_stderr": 0.010164432237060492, + "acc_norm": 0.7595212187159956, + "acc_norm_stderr": 0.009971345364651064 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed4/evaluation/rankeval/4b284b84bc4seed4_2.csv b/4b284b84bc4seed4/evaluation/rankeval/4b284b84bc4seed4_2.csv new file mode 100644 index 0000000000000000000000000000000000000000..61229bc84d46b7cd946d32d92cdd1d4022eda083 --- /dev/null +++ b/4b284b84bc4seed4/evaluation/rankeval/4b284b84bc4seed4_2.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.331,0.014888272588203931,0 +anli_r2,acc,0.329,0.014865395385928369,0 +anli_r3,acc,0.3416666666666667,0.013696658778002512,0 +arc_challenge,acc,0.2909556313993174,0.013273077865907578,0 +arc_challenge,acc_norm,0.3165529010238908,0.013592431519068079,0 +arc_easy,acc,0.6292087542087542,0.009911292822056925,0 +arc_easy,acc_norm,0.6047979797979798,0.01003189405279098,0 +boolq,acc,0.6073394495412844,0.008541161248702913,1 +cb,acc,0.4107142857142857,0.0663363415035954,1 +cb,f1,0.2951144094001237,,1 +copa,acc,0.74,0.04408440022768079,0 +hellaswag,acc,0.4667396932881896,0.0049787293000748915,0 +hellaswag,acc_norm,0.6128261302529376,0.004861084534087031,0 +piqa,acc,0.7464635473340587,0.01015009083455179,0 +piqa,acc_norm,0.7557127312295974,0.01002476517228425,0 +rte,acc,0.5306859205776173,0.030039730592197812,0 +sciq,acc,0.904,0.009320454434783215,0 +sciq,acc_norm,0.881,0.010244215145336666,0 +storycloze_2016,acc,0.7194013896312133,0.01038980964728882,0 +winogrande,acc,0.5895816890292028,0.013825107120035863,0 diff --git a/4b284b84bc4seed4/evaluation/rankeval/4b284b84bc4seed4_2.json b/4b284b84bc4seed4/evaluation/rankeval/4b284b84bc4seed4_2.json new file mode 100644 index 0000000000000000000000000000000000000000..4a5b3ce9478188ea64b99e5e817e7700f9099bf2 --- /dev/null +++ b/4b284b84bc4seed4/evaluation/rankeval/4b284b84bc4seed4_2.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.331, + "acc_stderr": 0.014888272588203931 + }, + "anli_r2": { + "acc": 0.329, + "acc_stderr": 0.014865395385928369 + }, + "anli_r3": { + "acc": 0.3416666666666667, + "acc_stderr": 0.013696658778002512 + }, + "cb": { + "acc": 0.4107142857142857, + "acc_stderr": 0.0663363415035954, + "f1": 0.2951144094001237 + }, + "copa": { + "acc": 0.74, + "acc_stderr": 0.04408440022768079 + }, + "hellaswag": { + "acc": 0.4667396932881896, + "acc_stderr": 0.0049787293000748915, + "acc_norm": 0.6128261302529376, + "acc_norm_stderr": 0.004861084534087031 + }, + "rte": { + "acc": 0.5306859205776173, + "acc_stderr": 0.030039730592197812 + }, + "winogrande": { + "acc": 0.5895816890292028, + "acc_stderr": 0.013825107120035863 + }, + "storycloze_2016": { + "acc": 0.7194013896312133, + "acc_stderr": 0.01038980964728882 + }, + "boolq": { + "acc": 0.6073394495412844, + "acc_stderr": 0.008541161248702913 + }, + "arc_easy": { + "acc": 0.6292087542087542, + "acc_stderr": 0.009911292822056925, + "acc_norm": 0.6047979797979798, + "acc_norm_stderr": 0.01003189405279098 + }, + "arc_challenge": { + "acc": 0.2909556313993174, + "acc_stderr": 0.013273077865907578, + "acc_norm": 0.3165529010238908, + "acc_norm_stderr": 0.013592431519068079 + }, + "sciq": { + "acc": 0.904, + "acc_stderr": 0.009320454434783215, + "acc_norm": 0.881, + "acc_norm_stderr": 0.010244215145336666 + }, + "piqa": { + "acc": 0.7464635473340587, + "acc_stderr": 0.01015009083455179, + "acc_norm": 0.7557127312295974, + "acc_norm_stderr": 0.01002476517228425 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed4/evaluation/rankeval/4b284b84bc4seed4_3.csv b/4b284b84bc4seed4/evaluation/rankeval/4b284b84bc4seed4_3.csv new file mode 100644 index 0000000000000000000000000000000000000000..88948b16562ae3af569d1e78beb7cba4cf809b91 --- /dev/null +++ b/4b284b84bc4seed4/evaluation/rankeval/4b284b84bc4seed4_3.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.327,0.014842213153411237,0 +anli_r2,acc,0.322,0.014782913600996667,0 +anli_r3,acc,0.3441666666666667,0.013720551062295756,0 +arc_challenge,acc,0.29180887372013653,0.013284525292403501,0 +arc_challenge,acc_norm,0.3165529010238908,0.01359243151906808,0 +arc_easy,acc,0.6287878787878788,0.00991359900184574,0 +arc_easy,acc_norm,0.6153198653198653,0.009983171707009008,0 +boolq,acc,0.6107033639143731,0.008528016290984541,1 +cb,acc,0.5178571428571429,0.06737697508644647,1 +cb,f1,0.4381559220389805,,1 +copa,acc,0.78,0.04163331998932263,0 +hellaswag,acc,0.4671380203146783,0.004978992721242829,0 +hellaswag,acc_norm,0.6192989444333798,0.004845668799108534,0 +piqa,acc,0.7551686615886833,0.010032309105568798,0 +piqa,acc_norm,0.7633297062023939,0.009916841655042809,0 +rte,acc,0.5270758122743683,0.030052303463143706,0 +sciq,acc,0.902,0.009406619184621223,0 +sciq,acc_norm,0.889,0.009938701010583726,0 +storycloze_2016,acc,0.7183324425440941,0.010401844358587667,0 +winogrande,acc,0.5872138910812944,0.013837060648682089,0 diff --git a/4b284b84bc4seed4/evaluation/rankeval/4b284b84bc4seed4_3.json b/4b284b84bc4seed4/evaluation/rankeval/4b284b84bc4seed4_3.json new file mode 100644 index 0000000000000000000000000000000000000000..3fc3fa234a95bbcc8390c0094e652b020004bd0f --- /dev/null +++ b/4b284b84bc4seed4/evaluation/rankeval/4b284b84bc4seed4_3.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.327, + "acc_stderr": 0.014842213153411237 + }, + "anli_r2": { + "acc": 0.322, + "acc_stderr": 0.014782913600996667 + }, + "anli_r3": { + "acc": 0.3441666666666667, + "acc_stderr": 0.013720551062295756 + }, + "cb": { + "acc": 0.5178571428571429, + "acc_stderr": 0.06737697508644647, + "f1": 0.4381559220389805 + }, + "copa": { + "acc": 0.78, + "acc_stderr": 0.04163331998932263 + }, + "hellaswag": { + "acc": 0.4671380203146783, + "acc_stderr": 0.004978992721242829, + "acc_norm": 0.6192989444333798, + "acc_norm_stderr": 0.004845668799108534 + }, + "rte": { + "acc": 0.5270758122743683, + "acc_stderr": 0.030052303463143706 + }, + "winogrande": { + "acc": 0.5872138910812944, + "acc_stderr": 0.013837060648682089 + }, + "storycloze_2016": { + "acc": 0.7183324425440941, + "acc_stderr": 0.010401844358587667 + }, + "boolq": { + "acc": 0.6107033639143731, + "acc_stderr": 0.008528016290984541 + }, + "arc_easy": { + "acc": 0.6287878787878788, + "acc_stderr": 0.00991359900184574, + "acc_norm": 0.6153198653198653, + "acc_norm_stderr": 0.009983171707009008 + }, + "arc_challenge": { + "acc": 0.29180887372013653, + "acc_stderr": 0.013284525292403501, + "acc_norm": 0.3165529010238908, + "acc_norm_stderr": 0.01359243151906808 + }, + "sciq": { + "acc": 0.902, + "acc_stderr": 0.009406619184621223, + "acc_norm": 0.889, + "acc_norm_stderr": 0.009938701010583726 + }, + "piqa": { + "acc": 0.7551686615886833, + "acc_stderr": 0.010032309105568798, + "acc_norm": 0.7633297062023939, + "acc_norm_stderr": 0.009916841655042809 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed4/evaluation/rankeval/4b284b84bc4seed4_4.csv b/4b284b84bc4seed4/evaluation/rankeval/4b284b84bc4seed4_4.csv new file mode 100644 index 0000000000000000000000000000000000000000..c1ee8235d27da4b74e6840a9db8b5fcf1fe5bcef --- /dev/null +++ b/4b284b84bc4seed4/evaluation/rankeval/4b284b84bc4seed4_4.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.342,0.015008706182121731,0 +anli_r2,acc,0.329,0.014865395385928367,0 +anli_r3,acc,0.32666666666666666,0.013544340907003663,0 +arc_challenge,acc,0.29180887372013653,0.013284525292403492,0 +arc_challenge,acc_norm,0.31569965870307165,0.013582571095815291,0 +arc_easy,acc,0.6266835016835017,0.00992500914280291,0 +arc_easy,acc_norm,0.6153198653198653,0.009983171707009,0 +boolq,acc,0.6162079510703364,0.008505584729104973,1 +cb,acc,0.5892857142857143,0.0663363415035954,1 +cb,f1,0.4120234604105572,,1 +copa,acc,0.77,0.04229525846816507,0 +hellaswag,acc,0.4666401115315674,0.004978662946687269,0 +hellaswag,acc_norm,0.6238797052380004,0.004834207964061318,0 +piqa,acc,0.750816104461371,0.010091882770120216,0 +piqa,acc_norm,0.7611534276387377,0.009948120385337484,0 +rte,acc,0.5018050541516246,0.030096267148976626,0 +sciq,acc,0.907,0.00918887563499668,0 +sciq,acc_norm,0.9,0.00949157995752505,0 +storycloze_2016,acc,0.7242116515232496,0.010334748387645674,0 +winogrande,acc,0.590370955011839,0.013821049109655483,0 diff --git a/4b284b84bc4seed4/evaluation/rankeval/4b284b84bc4seed4_4.json b/4b284b84bc4seed4/evaluation/rankeval/4b284b84bc4seed4_4.json new file mode 100644 index 0000000000000000000000000000000000000000..c70b87522a4a482e6f58aa21b3aac0c208b65657 --- /dev/null +++ b/4b284b84bc4seed4/evaluation/rankeval/4b284b84bc4seed4_4.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.342, + "acc_stderr": 0.015008706182121731 + }, + "anli_r2": { + "acc": 0.329, + "acc_stderr": 0.014865395385928367 + }, + "anli_r3": { + "acc": 0.32666666666666666, + "acc_stderr": 0.013544340907003663 + }, + "cb": { + "acc": 0.5892857142857143, + "acc_stderr": 0.0663363415035954, + "f1": 0.4120234604105572 + }, + "copa": { + "acc": 0.77, + "acc_stderr": 0.04229525846816507 + }, + "hellaswag": { + "acc": 0.4666401115315674, + "acc_stderr": 0.004978662946687269, + "acc_norm": 0.6238797052380004, + "acc_norm_stderr": 0.004834207964061318 + }, + "rte": { + "acc": 0.5018050541516246, + "acc_stderr": 0.030096267148976626 + }, + "winogrande": { + "acc": 0.590370955011839, + "acc_stderr": 0.013821049109655483 + }, + "storycloze_2016": { + "acc": 0.7242116515232496, + "acc_stderr": 0.010334748387645674 + }, + "boolq": { + "acc": 0.6162079510703364, + "acc_stderr": 0.008505584729104973 + }, + "arc_easy": { + "acc": 0.6266835016835017, + "acc_stderr": 0.00992500914280291, + "acc_norm": 0.6153198653198653, + "acc_norm_stderr": 0.009983171707009 + }, + "arc_challenge": { + "acc": 0.29180887372013653, + "acc_stderr": 0.013284525292403492, + "acc_norm": 0.31569965870307165, + "acc_norm_stderr": 0.013582571095815291 + }, + "sciq": { + "acc": 0.907, + "acc_stderr": 0.00918887563499668, + "acc_norm": 0.9, + "acc_norm_stderr": 0.00949157995752505 + }, + "piqa": { + "acc": 0.750816104461371, + "acc_stderr": 0.010091882770120216, + "acc_norm": 0.7611534276387377, + "acc_norm_stderr": 0.009948120385337484 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed4/evaluation/rankeval/4b284b84bc4seed4_5.csv b/4b284b84bc4seed4/evaluation/rankeval/4b284b84bc4seed4_5.csv new file mode 100644 index 0000000000000000000000000000000000000000..b65b88a93b56c3b2067e3dbfabcc9e904ab25c5b --- /dev/null +++ b/4b284b84bc4seed4/evaluation/rankeval/4b284b84bc4seed4_5.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.344,0.015029633724408943,0 +anli_r2,acc,0.326,0.01483050720454104,0 +anli_r3,acc,0.36083333333333334,0.01386918025244486,0 +arc_challenge,acc,0.30631399317406144,0.013470584417276511,0 +arc_challenge,acc_norm,0.3225255972696246,0.013659980894277373,0 +arc_easy,acc,0.6334175084175084,0.009887786585323946,0 +arc_easy,acc_norm,0.617003367003367,0.009974920384536482,0 +boolq,acc,0.617737003058104,0.008499149690449273,1 +cb,acc,0.6428571428571429,0.06460957383809221,1 +cb,f1,0.4430260047281324,,1 +copa,acc,0.76,0.04292346959909282,0 +hellaswag,acc,0.466938856801434,0.004978861409119807,0 +hellaswag,acc_norm,0.6233817964548894,0.0048354759576109425,0 +piqa,acc,0.7448313384113167,0.010171571592521822,0 +piqa,acc_norm,0.7616974972796517,0.009940334245876219,0 +rte,acc,0.5667870036101083,0.02982676408213827,0 +sciq,acc,0.909,0.009099549538400243,0 +sciq,acc_norm,0.903,0.009363689373248125,0 +storycloze_2016,acc,0.7284874398717264,0.010284547617192592,0 +winogrande,acc,0.6029992107340174,0.0137510925198067,0 diff --git a/4b284b84bc4seed4/evaluation/rankeval/4b284b84bc4seed4_5.json b/4b284b84bc4seed4/evaluation/rankeval/4b284b84bc4seed4_5.json new file mode 100644 index 0000000000000000000000000000000000000000..7be98ed73019d144370f12f7420e8ff4f6db620a --- /dev/null +++ b/4b284b84bc4seed4/evaluation/rankeval/4b284b84bc4seed4_5.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.344, + "acc_stderr": 0.015029633724408943 + }, + "anli_r2": { + "acc": 0.326, + "acc_stderr": 0.01483050720454104 + }, + "anli_r3": { + "acc": 0.36083333333333334, + "acc_stderr": 0.01386918025244486 + }, + "cb": { + "acc": 0.6428571428571429, + "acc_stderr": 0.06460957383809221, + "f1": 0.4430260047281324 + }, + "copa": { + "acc": 0.76, + "acc_stderr": 0.04292346959909282 + }, + "hellaswag": { + "acc": 0.466938856801434, + "acc_stderr": 0.004978861409119807, + "acc_norm": 0.6233817964548894, + "acc_norm_stderr": 0.0048354759576109425 + }, + "rte": { + "acc": 0.5667870036101083, + "acc_stderr": 0.02982676408213827 + }, + "winogrande": { + "acc": 0.6029992107340174, + "acc_stderr": 0.0137510925198067 + }, + "storycloze_2016": { + "acc": 0.7284874398717264, + "acc_stderr": 0.010284547617192592 + }, + "boolq": { + "acc": 0.617737003058104, + "acc_stderr": 0.008499149690449273 + }, + "arc_easy": { + "acc": 0.6334175084175084, + "acc_stderr": 0.009887786585323946, + "acc_norm": 0.617003367003367, + "acc_norm_stderr": 0.009974920384536482 + }, + "arc_challenge": { + "acc": 0.30631399317406144, + "acc_stderr": 0.013470584417276511, + "acc_norm": 0.3225255972696246, + "acc_norm_stderr": 0.013659980894277373 + }, + "sciq": { + "acc": 0.909, + "acc_stderr": 0.009099549538400243, + "acc_norm": 0.903, + "acc_norm_stderr": 0.009363689373248125 + }, + "piqa": { + "acc": 0.7448313384113167, + "acc_stderr": 0.010171571592521822, + "acc_norm": 0.7616974972796517, + "acc_norm_stderr": 0.009940334245876219 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c7ded22535d69a0f1eca27855ba89b10117130b --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d69739fbb2affaa0d201d9c42163c87e87bfc3327f85e3fd24963d34a1337434 +size 199058647 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ad61f749ad221e96ffe956bf575b236f133940c --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:005b2e6884e0f87cdaa7c74ca43e8975aa32955f946000e96a061d99bff1da8f +size 199058647 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f42ae531900b01aecf3fe6adf2e3d7aff54ed4be --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82114782a7574b6b99dee525a0959a9316c732da558677a8ae62791312a640da +size 199058733 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..22636f47035449fd4453860a04994ef37fabef06 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d42c2645ffd9313d61035b7276393315b574844c36a31e1d0651851d75c8eedf +size 199058733 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f617e82054386bc378483c0d1465ad019cf7eb72 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:686b34d4c04cebe7bd7bd19a937cb215675e146bfabcf41fcabccd612d6d6fd2 +size 199058797 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..419b0ab4868a3a4992f23c105a026458f3a323aa --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e49fa9472831ea68afa6088d7a75f84befc68b9d2aa10fa59e304c3b6890242 +size 199058797 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b2e3cd03e6f9d2c552996f0236e41a233d6be4c8 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2808b179ab2d1093e3c7ea7c1820afc238bf8c4b08a438af11b4db4537d24582 +size 199058733 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3130e687a990b2389a54cd256586efdc3c7e58d --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c256a639f0624e8e97c9efe11ba481ed03222bc2c61dae440de20dda2a190112 +size 199058733 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2492d0ea4a981e551ec0577d5c52e79c79d1335e --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91ef5be84e9ca0e8bb436f3a0110b7ac897ea589fa36fb453b45c88666301c10 +size 199058733 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cbcecc06a36182b5aaf85d8139163a23edc6c2ba --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:215fc4e935c627ffdc116c8cda2980740f1217584945657d414acc0115d8297d +size 199058733 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..612b47618c758828aabd68e8b6cea02a84c6b707 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:796b7967ee2e5adde309b44d7fb6186e996b8684bb008631723991bb19027c16 +size 199058797 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a977392a2e681680ce94708891292cfd9bb17120 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13f7e6133ae32c135ac1b3f290bc466e749bad04cbf498d7e80cd2280b743014 +size 199058797 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a1436f2c27c8c9d6bd950cfdf08efb44c2d11188 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:333aff8b51a3aa5fc703b19c38d66030294be28206638bbeb49d54cdc613ef14 +size 199058733 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..66e88f7d08419156be8e36288b482031b50f6a3b --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:981c557254ed45e3a9a195f347df8051862b2d6ae687774316b47ea4f0ab7df1 +size 199058733 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fdf43fb1a8c5f048569052240b149a6bb5d3ce1f --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a49deb94019f50bb4edf5285e83bef256136c2c2b0e15349de7e8e1cc0c98869 +size 199058669 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..228dab576ed51e8629a4bfcc3bc422b90ba62b4e --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e19fe45af772af5973f5d96daaffe3ff2d85ab4cbd667e6fc0299b42ee2f5ee8 +size 199058669 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc9e5fea26694077c10ad00c5e9676ab6c9a311b --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e8f7ca535b3329d749a75b9e7fd19eb33e8b0a06c8faa9047332cf0f36908b3 +size 199058797 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..58c65f7c5eb9ab7571dd91733d18c2c73c615d66 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8cd940d6e206b38d69e2ed166dd27186837877bb332d1c79cdc1252f88e4493 +size 199058797 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7896d1e754c729cc66000142675c3b72bbad94e --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:040bb180ca9857b3db598deb41f260cefd13824941e878ad570a557d3bf63e8e +size 199058733 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..30a472f19d5b773bbe8239f4d13950015d52a083 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f7560473b5eb887956fe19ddbc6bca1e93e1be53c472b04070a5d11db20a5fc +size 199058733 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..649e4181e1f8eabc0adb9f865c997498ca4a9631 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10c30b8042dbcc6c7415cbb8d9272ad07afccf5692fd06dd4665cd182435654a +size 199058733 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f71b6d1538a1639a030badf42b63f8a5e1cd8b3e --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24d31d3cd356cb76b36801d75c136f3c89ecac0703baa50381d5a00240eadb59 +size 199058733 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..226725470c9e59d1bd2fc782aae58c9b81ec576e --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c08c9b2a78c6c0dcb199e35ca242388b516d94175abdea9686b59d49e8f824d +size 199058658 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..96c8953281f734d9c95a8a810841dff727d153a3 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4777fc0c15f643f8919789b6d622c51a0fc8e5018d8fd8b84e9f716dc4289dcd +size 199058658 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f7c0ae4268750d98da52e8302f22345daeb3cbe2 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6fd99974eff52bd1ca2603c34d69457264f4cc5597b8ed5e18adb9a032b503c5 +size 199058733 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7e93afa3874c1ded56fa65c6ee7030cd404b8cb3 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7050c6e1b0e9886c6467b0c9446bfca2094271916f245e915f7e07fd0ceaa186 +size 199058733 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..67b4344df36e341e7bdebdb4a96d160db277f4e7 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b3e672931bf8c238a11c1b4eb5edb4ad7c703f399d8bd17900e7f01b8f74ab9 +size 199058797 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ca889150815de5876099ec99e3940505a415ed4 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b7fb5adf988b06c23aa570524ec3dd297e662fda7bb8252dfac8f5509e3785a +size 199058797 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..38aaaf8bd39dd66e0f105bff5d6acfa480c41cf4 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19465270fa53ac4e62a49b8ab2654a7cd0049e8c92daf3534fd801412d82578b +size 199058605 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1758c7cc46e1875fdcfd7a60abad4660ae1c702a --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fec2c8894158cb6302861b2d9ac0b2f03163174fa289fc5ea7b7732da8a1d2a3 +size 199058605 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..db7ee5990f56f62d9abc4a0190ce21c23bd6db17 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd2bf243d024acfeb52e999e26d360b5db1664538e9668645793c65da24e423e +size 199058669 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7e8f81c13fc2ad292ace709f9431b9ec7e0511d2 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0654396890a08cc94a3d491534464345d3fce01405afe2fd9933ece3bb84092c +size 199058669 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e35c0db61eda6ccdbcb8196b7acc7330ec56cc6f --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:044fdf59d3ac10c101abfb500a52f97d4761c7b07235ddb4904299ac05a45c67 +size 199058797 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..28fbd83e726a0b43f0e5c4bfefca1a6015784b9a --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d8f1e51109613d4c8b9f8549fd4ea2951658a43336a7277330973b970c23020 +size 199058797 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b71a810abd10be3f0e08999321b2238242313969 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:164fbda08f869edef782815d18f3c232d096f7990e5a04406f90e973d788e574 +size 199058733 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb99d462c2cc1f5e3aa09ef210d67ac88ae04a0b --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38ca2e922c64a8f0ff4b00c5542a3c1484a1c7609da01959734f07bf76c05d84 +size 199058733 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..55b293b8e5c22ff191bbc0ac0b6eae13c37be981 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0dbb9be82b1f8cbec777e6cb17091a790c2754f0bd505749548aa4a7e119955f +size 199058733 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..01d6cc9e713c46c7c37e7a241f6242e7f0324b89 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4abe909a40b2dd37ab294cf1c195772a6f82a42482c5d50cadf24470f8987bd +size 199058733 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6dd059aec6aecfb567902bc2cdc8a55a1a2adc8b --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be840eefc7b927f46236752bdcc38e4e59d2b010b0a1251a708f9e57cacd7ab1 +size 199058733 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..be6edd2ff0ced654658d1688c9545b645ecb8318 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ded539efd951fe2680e35df882205ba0662e07dc551beebb8031370486bb9e3f +size 199058733 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f53aff5bc70c020251f5f693a87fe1f586ee5c59 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2319ed85169816613dd13ed9e2a0c7757e45d33eec71bfb96203ee31bbb3b523 +size 199058797 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..07da48628b67ed058ec18455c9fa35d880e68a13 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c52ca3ddc162b753111e131219275c2f872a562259a5d8f2c5068d1956f0573 +size 199058797 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2cb808ce8a2e14107519f91c9d36156a92b452d1 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8cef0089cd1f9b62b4306ca29772a8310f62cacdb1b0a4728b5dafe18be636ac +size 199058669 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b08d0a9d3582f03df3e0281087d7115f9867751 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8fae4308555eeddaa3b3316e1af493e57ed8df95d71f2f682c633470c1eb17e +size 199058669 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..734e78056e3dde35e2956cafb4563bc936987b3c --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:339b7a0836068d2381f8f693bfa52f28a7e5176116e6b527f2b9389139cda72f +size 199058850 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..897e4b5997e572cee50626e61a3fbd81ece936f4 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09c4fa336435803134fdc3cdcab68082fdacb39f07f3dcbedad63486f1166d1b +size 199058850 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc6b306aac5b92aa14654110c067b0a57eb001dc --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1219b0906352b17944727427975038bba2cd0ce1bd42e0d56d6ae50eeb852df +size 199058669 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c760d6ae959c564bead0b9d85ccd46d1da3f6725 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a319beb5c6274e0845a81269327874f82b8ec110b2dead7a6e762d46a757a2b +size 199058669 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0b29c63dad0dc796a6d916d1ca9483733d91cd4c --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae037458cb9a46757ab83a6a2acf07c5b7c7df662ea1ea61e293f09a4c5febad +size 199058797 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..76e508eee0458f2ae265c4e04bad93fc529aa681 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9bec982b5681db7b7a3718e1c4617f59d44736577587e0693dd6221719371e30 +size 199058797 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9dd891fdf0ee27da038a13e764a64340d2d36fed --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd9d161491baf48f248dd2f6771a42c1f329584b3c1a98a37cde6685bf181c1c +size 199058733 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..354a81c68631c7bcea3b5b35e12a87673e12f884 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90423e3fa92907b438bac85f8c4ae22a386baac0b519a04a2a56275a9069f9be +size 199058733 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e61498c0ea3c994ab189953acfffa7178d7dfff9 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12b3e312faf6c72522d77e35b568d4b653f30d00090ba69989c6f41aa4abedc1 +size 199058733 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e1d0100b7ac12b070b2deed22093c1a1a91a217d --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99f4fedd32a34a6c1ff79b2769458a45beb4ddcea2c8a587b54b1fb0f5c1146d +size 199058733 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c67a331940b4fc45555d747516684d4e9a06d34 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f84847db585c6ffc5e73c4e979d87e8ef51595fabe8515073ce36578161ffa89 +size 199058669 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe9aaef1d8e892a2693f6946e32350c4dd271b47 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c73ce5f2ac22afb7d90031077d362ca03a46d6793eebb75533689786e59175f +size 199058669 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b79994a0c7556d862f90b4d8d9ee20ed6dcf6ddf --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01839b0ef2f0b826e99d468b26adfcdd93593abb2c25324c70916937fe342648 +size 199058925 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eba24de73f402d60d2339c46525fdc6b2ac65f6a --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b12b8bc119eeb9a6935a5019b95cce474471240d1f0ef6d59ab4566cee37167 +size 199058925 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..48ec5dc4fa31ccd6c00ab68d7e9b5810915a826e --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5cb065091d26ee3963f0f01c00572f8c4589ad39e08fe90e87cef978da861828 +size 199058605 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b3e6424054fad88cb2b8029f949ae9a9671dbea9 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f5242cd577074316f85a7613977d91600f2902997b501e8bfb738f57245d578 +size 199058605 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4eba9f6d384054357492b3edd1424ef1ed81c8f9 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2fefc5e100949a36acb1d20fea52e347ff57655e62f46bf35ba0d8de336dfbd3 +size 199058605 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b878e48081f5e245a0748d784934cce8e90e0f61 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3e9cb5d3e161de1d506e893c78f0a8bcf578aba89d1e1c9725994236a31f585 +size 199058605 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3d575798be1d6f56546f89aae5c74f0abf7352b --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e48c2bd9298568b374aa45360eba05bb18fce35ca9b1e209ef9007873498ceac +size 199058722 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..921d74b1347e814be6047d12373b93a30a637de6 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67ffb28817a46faed81e5804e93cce9b9af1879df1493e83bffc68e907992e3b +size 199058722 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..191298c47306e2a0dbb73cdeca186408ac886841 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11615994b2a264b1254af9d520bd2c3057a8dea44e98d8058686710fabfd374d +size 199058658 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb6f1c67e48ebb2338cd91bba1fe6a666e50f9ce --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69547bc0344dafd035d99ac5c4c702429003365be63af8f0ad9fef677889328d +size 199058658 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..744e9f29eedb5b73126267ab39159eeee0dcd507 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3282e99ee24e58cd614d64d9d92dd89cc5c3fe116f960c4ee2592b2b8e936975 +size 199058722 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4cba6f0f68995f3d76c60e2836398cb692cc5627 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb71cb3daab0c78dd8a2335ed49bd1d3a14d694bb3726726c1eed7e06c9cff02 +size 199058722 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c694c831327fd21962ce629ce6788dfc15c1894c --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b934ff169ecb5a84b737ace8a0085a7a0dbad1d5d715515482246799eda85616 +size 199058658 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ba6ffdadaa2c7d6373f43b1c323da9c953c8cd5 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe604ca215093db8405bca1d79a71413c2616d3ff8d0a50fd26b0b7d3c634ef0 +size 199058658 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4771fea31bf1ccf40d372ce52f2836d0ae5de6b1 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce5a7d1cac9b4e3852a5bfda3a064e3055261eb19a77f93c0340f5d45c09475d +size 199058786 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f5a8ec98a34d2ca992b165735b55567c7692176e --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae7cf8cf9692cf50e139698a6f3b28e29b2b8f159da1e78a1e2dee44ae399643 +size 199058786 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..50df76449fe364011b886b56911479b7a8d5c1ba --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2dff9f1fdda08bcf83579bc039c23c0abdc88de3ca452e8945e3468c720c6fc3 +size 199058658 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..55b0afd11a4964aa932506245e0ced2c4086801a --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3640e66a767c4b0aded99513ab0aec7f8531d66c1cfcf282503a480a9e7b9005 +size 199058658 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a9b55a26fac63fa1553a18c2668b74cb0b7dfd1 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ebb5ba46342b53100981a3de13dcdb8a318fdd5de30bdb5833afc2b118e9b78 +size 199058978 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..433eb1a431de1881e5a724fa60f54aee7c4d08f1 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a788063c85db307c79c395c8a180dc0d025776ce9089107cf1073dbe984c2ae +size 199058978 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b85d3c6d19f4da48d48104143429949e35c37b51 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfb358a836c464b8207c10d6d7c8d234ac9e5b90bfd0b32e9f3189122b3a708a +size 199058658 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c3b83d969459d6513e2b85cde81bf45340810a6 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75d21247e97eeff70f0e8a47d40e3e93575e32d67bc3b668b83d0fedf2e7bf0d +size 199058658 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6429491a1386d3fe365c1be41c87867b8c49f812 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f74136ef0eb05b5c58611fea27e59ca2207d0f496899068c49c91727584eb78 +size 199058647 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e4fab7f9f1b7e4992eefd75ae8dbc27d063878ca --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de1435ba9ebaa5028a38aaef5b77e1f279957e6c9aaea79c3f54cca4933c8d88 +size 199058647 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3c0d027be81258211f06e5368ce2bb638194b36f --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed09f89b5180798537be98d2940c67f4a8c225108a345f5ebc1e0cd8e2703b9f +size 199058658 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b855bd77bd57d532d1f029b8b3fbf655a3c523bc --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3663f91f3d67fbf769c027fea42b412cdc362a075c9c01b74be0c0a24be92e5 +size 199058658 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a9c52a68176d92157d2205f9637a4d4b53dfa50b --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df4d9ff50cd6626b6486f487157c36d89213f879a00b926a85a9d0fb84d7bca5 +size 199058722 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..27f34796d278e3f15998f6e6900623efc30bb144 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c5d03ff52a2299d1cf99f549a7d5fee91ca29ffa1343768deb87940da182a19 +size 199058722 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6418d2d238a1a48c9b63148d7a267e485a49c7b7 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68e26bbdec28c4a31d5b280c65eb3b40da929d2b935583bfe276a62bfa2e299a +size 199058658 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..24f4d5d901bc96e0da5670d191593990650640b1 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:edfd8f3b5c77b68fa3730674a480341556b13ddbed657e0fa32125fbb98000b8 +size 199058658 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..81fac8c61d01819767606be1635deb8727ee1836 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bcd7a9b1426624f96f499f35ea8200d06a59f17d30996d7a4c9092118eb75588 +size 199058786 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..da53bf3a90f05576e9506fa9b90550de816e716f --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc51ac61a7f5d805ca13feb9894cf10ad5ab21b649548cf3880e2149490087d7 +size 199058786 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8574ce9454b30dc4d829b8a7f2a3ae5ac1b2ace8 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04de1c0f5a69256472b9ceec8d252e9b37d969072df833869b44864853aa3281 +size 199058722 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..68315418d2b5d76c4437510880c5f6c4682adf10 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7be581f8c51e463893405509e41377b60efa5e70f9c307a5d2e3fbab3604b046 +size 199058722 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3d7367d247634008bb685ab8d4575c67b3ab2078 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:677d0293c407ec7adeead3367ba784c5a0f3e911d2ffc084751ed39ceefc20e1 +size 199058850 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6592f71d104fe1b8fd0a2ebea53ad7d6506a8d11 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6832e1604f6dbf3c48db590dadb8eb44c56a02081c261a1a7daeb9b468ff394b +size 199058850 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb212fc7df08de06c028b021222023bf5f8405c9 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9ef405567560a33df47904431779554a4a4d215c348905dfe919a1f14a0f54b +size 199058722 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..29e6fb633315d09dc7238e0669e9da75ea5313f1 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9abf2249160f681d97abc1fa62a8ba84241682991b816d92f520b32d7f94aa3 +size 199058722 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..88108c3f1f43d6c32c3ca116a5c6c86668d4c087 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d9805045f6dc367bc112171be3544d89da129ff4ff97f7f3250ed3134877d96 +size 199058722 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..062b56d899bf3c41ee5052199010139c06263c52 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f0beda6caa0312e614ece4f0e913df01c3a9236c537a5518641bbf92418774f +size 199058722 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a5897f3524c7800b93b44d2aacb1138065a70189 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ab0f45567a422506fc66d440f7ae56b5ba3a80c39936739479668daef4e2dc2 +size 199058594 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6bb8328b8edd309ae8fbe05ea8eae4e93f0c222d --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91ae72865096a06e953d1547980cfcf7b0ce58d176ae46cbc65a87cd482f7048 +size 199058594 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bac974134b1992ea9937a7e2801a651225324844 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da2576e07d3a0e62f6a008bff2d8af46f9e2044708d21cecaa266b72864e4d49 +size 199058786 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..97c3de08e90eee053323ed623bfd2c1b64b2cc30 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e36a5bda70ec1c882a7e50e01f7fa00a8cbab6ca83fcbaba647e61d6071fef55 +size 199058786 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a8f551a5ab8b41ecc3b92553c490e94085b286d --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27d14e4c86a7d6aa44d27d8842b9fa9e07ec6ea748c8eb3541ffe4bf27eca8b9 +size 199058711 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b4e13dc6eba847983911e819c0ac0eaa86b72e4 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c80e1a4b16484ffd8b3b3dbcf95407cc002a1ec3ab7dd9c50282657454b846f2 +size 199058711 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3689e58ab5c3dbbd705a870c95123b7a92307e8 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:555df6cefee4ab28575e445ea8cf62f6b72bb90e084c91b88e18c12997ae7556 +size 199058722 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..33713289e1bbc850aaebfbd77c093e11b764c615 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b8ec94298d9ecb88a5537d9da74b28876d421a8f38f5d0b37398c2003978fd7 +size 199058722 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..93d6e4226c67ee3f3bfa438f4a234bf4372fc559 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:086be9ed6210d627158f1c6d0ca289e9e929420e948d3f1cc60878c8a3e7ed0b +size 199058722 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b3135d31611f1a64c57e0a3a386a6e15f12e218a --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80001a30620bae5ce7e8826186da9ae66080b2d95987745e6f2b38b27809c255 +size 199058722 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..714118f85e9fe0f0d4f5a506c6cdf43c7eb072cd --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb4a8aee01484a888a3dffd941d6a1bd22b134379d7a193d7b618e35582e587b +size 199058722 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a8971d26b9e38026126fd660724b0cf40e5ab59 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0682f26de2b8255f843951de1960e707b1c634a4499e84bdbd181c55cb28dc3 +size 199058722 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..279295445b4730bb8dd333bfe30b44fb0ef2621f --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c62028dfb563f0bf67f4147d85faf0d41472470248a3418d71d95a0e3b89f5f6 +size 199058722 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f83b2897e9342e80dba43c5adddda8a42197c1e --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9380f95f31dee007b7127327aa3dbfb352d65ee46196e8e0061ec16ffb4f7b2e +size 199058722 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd58d5bc649215ac918845d8b255be4612aed75c --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:949b42e912cfe8af4dcb8d2236008d8decb598fc7f60cd5a70f7c6aa24cdb0ed +size 199058722 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f69e05ac728d0bbb65998b5723b746b7f382ed5 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:367c23edfa70ea3dfcb3cbe377f3e7b78c995e7bfe5d52d2f662979a5281f559 +size 199058722 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..686e7523d22e1f4a423dfb36d1030675ccf77c1d --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c591259b582fd29a8fa50d92e5ff41302374956fa1b1d1b0f652c455367ca805 +size 199058594 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..97062ef22f8482d65d578233e591c682ab2fdb70 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82a908a2f9e75d1be99dcf23cce493691308ecddec44113f092d048642e28e28 +size 199058594 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d06282f24614fd6ba9b79c8d6ea38af93b1f1ed0 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad1065b46defa49f7e7751fff476ecae94c897cf3f1abdac3bd2c6dda11d4a79 +size 199058722 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec94d9141d05f69aae757a38d38cd6a5fade8ca3 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:196d8cd68324a9989436532c73bf952025d2dfbcec86bdafaee77dae7bc6cd05 +size 199058722 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b2f5534fed1664bd7d4ede35918b8fe81fcb48e --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b506f9408926664b78f2b81567e9794d72ed7f1ad652dc766e43e3a82b307836 +size 199058786 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2593dd574021fd05e03ea87bcbc0d9347b046e16 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad04c1a3e9f0e64f9d5bda31ac1a90780401f4f1924679458b0212a80664dc1f +size 199058786 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a04a49acc8e6e950bb149aaf0b6c2b20e862dd98 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef4247542c6267ff6df617fc1919cde5ed389332efae8f904646740c3cdc9d6e +size 199058850 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..de1df65a12a10e51e7a54448904c7e2ef3c819ea --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90c0d3ddbe82bf2faac8c3559568ae578c514ed69dfe7aba75c66cf7aa100e68 +size 199058850 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..65c497b1d08f20727c494aeb5bb2d162d5824c85 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94aee15070d0f011a03844842d0e3063e8c025f0356f74d9ce2249af2448c214 +size 199058658 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..64238a068fa90f49cccf92d109bcfeb376fc0958 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f8b27b2bd15d9bbac27d30e5cacb36d8877ebf75317e4ab329bb7beeb1a7936 +size 199058658 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8d4d46bcd5955d4c84e7c96d49e436fef71af686 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03114241b333dca053e45b901b053deba1808c8b634860e30b465fc56ef1235f +size 199058647 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d83e75e69866ad9f4845c31a330018463b585930 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a268a499cab9d3c81a7628ca14f67ad94b507c635c4b0daadc30048e60ae5a69 +size 199058647 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..914edab07620f2d69a82e0edd34750149f4384ab --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b78657794153fe284313436a4568f2c90c12deb0ddf0a815096ca00594cbc9cb +size 199058722 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..03549c5ce6d7fc6edab9be495f90726746faee51 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc7ea1ccbf7db3ba155aac5e5221a4929f1bd46d58fffdae34318c1f539ff6b2 +size 199058722 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..79a2d92b5795138fd46dd486ee89b9e8d2f6fdbf --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f23644758898e73c42e45eb21b541ffd560fe5de836946eed69ee4b6b210369f +size 199058658 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..88452c9292538b07e215a243f68e9480737cc1dc --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90fdbf842853c8ec58ce877185ec89b16d76a110e1dae03760e057580709db87 +size 199058658 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb1ede5e2135d596bae9e17ec64858c9c821e18b --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:969d26099814b4b62d3483e6aa5e7fe2a1694ced9344ce2a1bd2fbaa6f720348 +size 199058658 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a99e4f7b153136183a78c1491dade1c8efee9f8 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:79aa89ca6b68a4bfe9db6397d22d94c55ef0bdbad20f590f1948e4dfcacf0104 +size 199058658 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..03355c9d5789148cf99c1e52d3295693571313d1 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78fa7e66431da1d08950f71368fa6c46c47a38b7ba63ea359848532a02c9da99 +size 199058722 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..307cc684393a0aa4f3d9c8798aa1e526d0a74060 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce628da0536721482ef684383429395156230665ed67805856d865a861049df0 +size 199058722 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..72b2e27ee571cb69df2e2b99c8c03c66af0d8c0c --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5026d651022867dab95255a511d5dc6894f4992908d1867aca8caf7f69f92c0e +size 199058850 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb91f7a0ae5bb04a66effb1116fbe7802aa7111b --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b936610ed0ebe63966a7b379decc463d4856c3de45a51b4bd11d03c05f519908 +size 199058850 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7b7bad993fabf1d7c63d3b7eeac1be47a5cec99b --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75d321e126a1ec982ddc5a52b8047711fd0c77cb4cc1360c11c1f9f99c68636c +size 199058722 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eca00eaa409eba0069075ecb059788d07cc20cad --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ef2df9ac6631a5369732cb76bcee8041ea453a1a9132727b637a8299c36c0bb +size 199058722 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..31901f2cba0feeef7267b47dc9185e3a0e815ecb --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8037f521e806527a89a8fa1589a0a5bba4e534a47368091e620d9e0d2a18ec54 +size 199058658 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad5c7614948c721b99e4cf0beba69470c03915f0 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26e7579d796a671fd8947406579a26df466d0285be962ba7b146589281bdb4ae +size 199058658 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..93339d8386bd9a57aa34a5c1b7b2be548e01096b --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cab167e27601b76be2047f9ab291435aa6cd529e5b7019837d9e857e92b4efa4 +size 199058722 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4560c95d52fa27575191529920b9fc6b1544fb8f --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76925fe7c7d3409ec757e1f138878fdc199c694e8b260a502c2ce2df8749edd0 +size 199058722 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..024aab61c6f1761570dfa4b966c2829a5d04e2c1 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f89d4b8b61539e3a3e6f8c383233a969215966be10933475b08a92d056344d5b +size 199058658 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e7515e0b7b374b364b870ea53f93f63dcf71623 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d9908232b9802c3c7f395029347400cbf8910484fc4fdfff50fa154b0270b71 +size 199058658 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dadcc07b128ca84c296ff77a5c2ce3311a60648d --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da4d1772129dc344e8aa39922fdd73341d0df62c485ddc0fb48677d0eeccaf20 +size 199058658 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8753808794d8159879b8f24f0fb9e08c60db0b57 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aef9cf54c81d031a132df9e0be6cd0d5b8f9bbb22198558aa056ff2f51d5cb1a +size 199058658 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..db6dd693a4299684483a916b31216d0be09b3859 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99f868c671d38ae8b40ba46796bc3bed73d8c9d177d269b207a85dbb50e5eebe +size 199058775 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a1189c33b140b7af4402abe88c0d408eecf00f15 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:315a111dfed1f10a3025e5808482c1ddb345527639b52d75d91502fa11b20545 +size 199058775 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..724e1bc3d6be417cff0015257387ea319a6715e1 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19fee6ba9f7664a0e9b43b175898b51c0aecad1684c44b42a827bdfb077854a3 +size 199058722 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce9a7fb16864c3c12b97900833738213faa785de --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6bd00ac2a7ef1ebc1034a0ca635aa1384513c12fd5aabee37f9a7a3c09c4608 +size 199058722 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f4fc77dd9da8dfbbda489971a8a49bad25aad06 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8902f96271d30dd8c2421509b7d3174e528d35fdac7681b7c5a0b6c9e1a2024d +size 199058850 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eda44cf14de0a36ce10dcd6977bd857561e28f92 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1229c6284bb0f445cac1f50d40671df67bdf23de163fe757da574ae88359f0b9 +size 199058850 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..379587e7242ee989c3cd5cef80b0d71afac47a72 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9396e0989c987c30ac8e9d95b5eac016be72ce094350b79f3b5c7df4979a4dde +size 199058722 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..21acb9e090757eb926472791912008930e4acf0a --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ff915a440d95437e12a52f5f7853660538e08fb74db1bc960964b7b6b433db9 +size 199058722 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fcdf82c5d7ad5ec3560e4e5d8f7b135c887ff364 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:878d1d35be087c7f4044a4316e12b306edff78b4da0b1cf3f182860a391753c1 +size 199058722 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ac6a6ef897dafe0f6f3564bb10ae5cea7574fe2a --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23aebfdd2c9e14bee463b0f953d6498e74419cbda3d2d4fb66a7cd6cd10db342 +size 199058722 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..67662b813f3a569fdc45247a7d91370b5d15a5af --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8eb5d88f7562f0961100bba7eb0b0e5ca803648b6fefec6dc66f7baa9e8f8fcc +size 199058722 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e4107a7b4505ffc943007efcf32562ebf194dc62 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72400a61d508e03c29259ded39d65a6f0d5fc7742f94517e6eb27d8b3d7675ec +size 199058722 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f9a842797bfb9e387c6929aba2b82f83b9f0a32 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0302168be3942068fb19f37793924af2fb2eecc55c6b03a1e7323d001476fa5f +size 199058658 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b34948ad5bf1c4f6d7a0cbd06b649d8f9034731e --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61da7eacf87d764b2b47ea8cae28f948181e12f0180d139032c3726e564811cd +size 199058658 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9537a6908c330de19380bf0f661f04653e6e569e --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0bd199e60d6bb52135908db6fecb9a32e29107c9bbcefb576e0464f7f6610c50 +size 199058722 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a759af7879df7806a8cff29864115f4edd16f773 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7615008cc8d998117e6e8e8a0a1aead3752224878204306ef2af79ec46ab80dc +size 199058722 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd64384fdfdaff9822b139b86d9b97f1033e0355 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ca94ca9b0f6282338388659f0ff8dda14925f9e46667ff864d836474fdc0a31 +size 199058658 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1da2c4c3c17c8cc45c39a3adfc5489b995c287f3 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c24a29927db887a2b0ef89b0758158cd29ca700f2b2a2e9f90432067d72c09c8 +size 199058658 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a160ba0f91f53f972df95ef93fe9c02f664701da --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3556d601483097a550941d070248a60e5c4370a468d62bf0e9ed452946d89b8 +size 199058914 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..20536fe7bd8ec35d5a53cf6c63d2b47d261fef19 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38e8c7fa3c677029169d2803181d6202a2961b0bac69cfe9f979fc62fbdc19be +size 199058914 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d1e7ba4c011c7a93e5e50ce3c972f7fe9b44eac --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d602f3cee4d8fec9ddcc9fa324d79a946247147d5d56ed07e4349ed8bfdcfb41 +size 199058658 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..91cdb9ea0cefb20d0dadfb4554907168325b12f6 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfc26e58485e5b57824e1bf2f9842f14b525e0c1239c8188961df065e5843901 +size 199058658 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..04d17858f33724c7ced438fdf1bf1a9414243285 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9487f622f121cacd267cbf4446e7dc0b7daaeec8d36bf60beb16d663284bc38b +size 199058711 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..12e88e2143a4a0048d3e10e41c113f7191fe2de9 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dbf22da57930f2c687701854c07954eac164d54bd1b0d3844cd5124395105645 +size 199058711 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..687a4ae08a8c54e6e604730ba2a6cfbc8c2d0e4b --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d04882695553be37b50de7989c3bc00f65d250c830fbeae72d028d79b69d7cb +size 199058722 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c96ee9f8140351e65ca6752c3d7ce0770e3e9a1 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e970d4df17af04428d3476b513f782e2d7a1bff069ff6e86010334e202740310 +size 199058722 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..95c0932985614e39c2f41e1648ec77b4146db18f --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a156e0a9e5b7173815e830443e1828647116316baa2651870cbb7ba8c01aadd3 +size 199058722 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..29837360ee6079bda21ef5873cb14e36b3819cd6 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c42bb1176c1e84b3ab569535d62f40805fe91d8b755737065136aeb15591220 +size 199058722 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..de3292d16f5f57718703de4a5007b08918d2498b --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:058e50f4280cc6f81c3a8f7741e7f79e6f5eabbd72d0fbd6f541b3aee32bb314 +size 199058722 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..187539386e32be17c3a7787998105fbbd5369768 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab66d7be9d6523fc1e6eab9268d38fa247498089eb3b25cb07ad95ff4ec1a409 +size 199058722 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6792456ab36bcdbad530b7d0c33e6cfa37be6e21 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3334ba270873a8eade3c95f87b3400991ff219cbce3316fca269e13a73eb48f +size 199058658 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea50a39900033be627eb78cacd6c8c0a1ebebe30 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:656ce630e29176e35c7199cef6d09eb6c9be5b222c201f07173b36b2f030d2bd +size 199058658 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c1203929d491a193f590929c985cc4b6b8cdde8 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1692f5ae606e279caf37077515a06d22fd7dd185d8863a0672d2a1023a957bfc +size 199058658 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..33fde9fc4d31d63e701c117279278781fdb73e80 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4db28aaed8d80d97280d858dc424e079484fb7bca7bd81c05484c07dc89fa5df +size 199058658 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1bc0df7f1483139550194b0eb5a97e01f8dfb91b --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5b04a134e5b086761872ac3d9e7de2eefbb2464a96c8df6511e0504e34fce80 +size 199058850 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c1ec87e88f5b314a7d27eb8b51f5927add142940 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d903e3540bc838bca1c440c787c762cec6342ff4d85400fc366e53911987286 +size 199058850 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d00dc9af4a9ea8738e26bcd7b9af42eb3e62fa2a --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1043feb5d26c5751fa280632912b02a91218166a71bdbf6b7dad7cee902e19ff +size 199058722 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ebcfa43ebe8b501a86ec461552b91c8d1ac3a1c8 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:377ba2ff67221e7ba41bbf1d5429936dad1bcd17e74caaad9b529755dfa7afe9 +size 199058722 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..78b551f0c4d928188b5e430da8a4eea1afedd8c7 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e605c114cc173e0465bac744033f46e53a6d2fca122e2457539cac1141f3fd1 +size 199058786 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..78f48165bdeb60cb4692a0710c5932128d545def --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27bf6a7e785fa98bffe25dc5bcb7b7fccbcbd2f9510dc66141e025d857ddf430 +size 199058786 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..81ed802336ee38dcb74d86cd2c6eca31f1f5440e --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:137b48bb12edfa78e2f5ddf250bc97f2567c23159c921ce9cbee4a918137d99b +size 199058658 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd4455e7b1cf6f085fc00333a84641e95b626032 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b2089c5fb5ed7dbb0a20c5d2add70d47aa4058dc293ebdff7837819b3521743 +size 199058658 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..64d755968af5195153a48cd66e63ebcc583b5f61 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c95909cfd7b265c22d1d307a4bda1cfb18f6763f50d45ea0a4edcccdb98a269e +size 199058722 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..80a48ddb58ad18f9e510181eb90d50718c7856dc --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eeaa4c6b7e207cf7556539da88cf56774ac1fec1ab0af224f206333b0984a0d7 +size 199058722 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..716e9330424d266d7d785a0d744633b9da359c96 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5815300a0d4ddbf94c767c930370a66bdd7cb515d8523a6445551b405e52d0ef +size 199058647 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bdcdc8955fbbad7155f0badf70fa0939d6104cba --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a578db6ae0de06e0046f5369c970d29bed64f8d3d52a850364c1e33d5869c8a7 +size 199058647 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4eb5bcfd916a44035fc61e3356b9b9463b1a9d8a --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0bcf4b8902409d900a110555761a3855356dd0873c608539ad7c51d38ab86063 +size 199058658 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f99ead1ca11adf2514dc7f516cd73daaae50116d --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1cfdb0f2ad86039e3f5548e3e42cb08474489aa5077e6fdcec6050c08aa6aa6 +size 199058658 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7e94e31e7bbba7724006e63ab6e7e1ebaf3ae2d1 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f9cf79c83039c8ef3c5d6b51fbc102d0da1c6fb95191d0a124077dcf707c3f6 +size 199058722 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..605ea57afb54ceadf55c31771e05e9549988149a --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d58d1ca45ce0de513450b7d4e7c9806b86bbd8ec63539779cc2140dcdd5c796 +size 199058722 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..76ee56507c0f25400b35f3f52f64322bbb57fbd3 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4deeb4fffb4d9681624008045ae03c5dbbea30526f66906febb132df9df0e2b1 +size 199058786 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..76bfc4b41926af032be3f65c018504dafdac1b4b --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:968f90cace47b76170303f5c5736cba1bdc7c2702003cd10d074a3bdcc88ea62 +size 199058786 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..776fc24e540d1857980748bfc9c2ce9bd84afcf1 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b8398e3bdf5b7c5a78955a1cc4ef0658f656f8c09e5df005e0e07a395155beb +size 199058722 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9198b5aa3c3ca31e25ded1af17d4a136014c4e3d --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd1871409ab943ce628e8fbf7414590a5f9056fe75f6c605faab7eb63db10b82 +size 199058722 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3f5fe14fdd4c34bd4b1c121792738610b0b6dcb --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8550d9c68c9ea68c4285e2c638801e963804dddb9d49ae1ac7fccd5a53fbd2c6 +size 199058786 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb819ae416bced9e62e4be571681c8d5456351d0 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4056e192ecfa5335e59d8a005aa716d599380dc955582075ea363b55da229539 +size 199058786 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..624cf0860c0db971131cc0bd614b66483c4a31f4 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e414098859f5bda63eb54cdd726a6a4defd0ad9011e583cc350eb29fc599875 +size 199058658 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..31ba60bc76a3586c0caf7b56fd6904ed72430a5c --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e9831507751bca73d76bb487bf1a6451914bb0e824c49bc6bea115472627313 +size 199058658 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0e310e86c4c03ac1031f6ccb69d5bd07d24cabdb --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a61c9929b1817aa12b4302377675db6eaf9839cacddaf9f8cadd60743372d6ef +size 199058786 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f031d2aa3a0fe4116a613b41ec0789e896d6cc26 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12dd43558dd1057f38afd5ed19d0d25f5f932325411a475e1432262109869d3e +size 199058786 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..60bf23dfa66141e8bb56b91c98df7344d1b00844 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c088483b227ec2559412d2a4921401e16f57874489c10bba6716c06754bfac0 +size 199058658 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1292612b300a1e6bd0938aff37aa0f497e131c46 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b996583ce813940710c5b4d8c06d2dd30d11df333a89cd984e79915c983d7a97 +size 199058658 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e133ab50bf69f4375962c7661b1a82b1bc3d2309 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74b2661f1daef5b37cf613bbcf68c444d05c05c19b94078539974feb339bb0bb +size 199058786 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..da4bde6058aab06a92c9ebb4e9f63a87d6fce07b --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f932a625a184fa4eb5dee796fc662d2c87412a9c137ba0c455997d625c54cde2 +size 199058786 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f57cb2cc3d00eb6b5797c287b8c6281e5b559cec --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05bc5cec7ab11bc31f93c4eb7b7fc7660783dfc2d83f0956c6dc6a885bd24357 +size 199058786 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..79bb6419adb3ccad571450360b055c815114f80d --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6415bcaee99cb7229a90c5c8b2962f7412da053f86b031d501d3f1381b696e83 +size 199058786 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd685773ab22e18b8e20d93abd4dd4c013204cb2 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1af8d2b3055e21789123d11b70363bb16ce0ec601ff883ad6de493b9df293874 +size 199058647 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e326fa68025ac32b15830881963c7036674de6e --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa5fc21c530648d631e60919407e9de605326d07509078f77a43ca9f49bce1ca +size 199058647 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2801121ed448bf0b781bc4ad23817175be7dc9c9 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3566dc853e49435793b4f5f4c522165573c837aaeceae4320fd4f25d865cfc6f +size 199058722 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6359341f31db3a4fc05d7e37228207ca743ad798 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07adc5629fd1beef7559b4066528c0436af3fb5a454559531fbeb41f512a4b87 +size 199058722 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7537e62dab06cc3136e4bed53c188c0fd9680b42 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78ced2df56a971653aa6d5867d66f907e9eb37a1442b9b0d2f95503b58d8b997 +size 199058722 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b6d340dbea28a15d8224d0e55d39e4b54144986 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28b782ab119b3b954108dd3075ab0cabdd0c4a8b41753f86c222433541a68c37 +size 199058722 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3d9281323731884c2387bf64ac6b44f55ac36cb2 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cff4c8713559acc701acf1bde695beacb9308c4be2885b9eec800095409f6a28 +size 199058658 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd69911b2005a951e4cd27dbf172959908e423d2 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26f302327cc1ee8bd9a2a4ad7cce234b4d82f46c0a6ba9792c6144b0d5dd7c59 +size 199058658 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a133eed7e32619a778d9933b4659b333a05365a7 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:708caa2f866d5a50a23cd982bf7a93fe144fecbef767505fe8cb5d30e4278e6d +size 199058786 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d5955a54d2e907f0bf692db7961c2cf7c1f0a330 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:615d968dd67ef0b659851bd79f8689abeec1f62a0c06c0ec1f127ec5012bd814 +size 199058786 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e42977fa0c14fcf0424f03367a65223305ae9f8 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45465afe67e7f88b3069bee5295babd99afecdf3105f0d1f372dea32d66c0053 +size 199058658 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..02829fced6d6442ebe7f001cac7c504c4d4538d0 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b5349bf045c1abe4065e8b7eac1b47997086b14a9d5f9a717ed62d7abaa2ef7 +size 199058658 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f851735bb43524a9346f7fdad254b53442da8e4e --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d38cec390a21b52fbc9db7fb9d55a6ddc10335e919eb62b89e190ae5a61459ed +size 199058786 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..58ee29119fddd54d86502192f1e1ea12887c5b90 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c773100f11c1293280988422920294ca4406a83e51789d5baf1f9259c8e0176d +size 199058786 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b174b3368bd01f6fd731ae9e1eadf3599de299f0 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:133743ee5b2dc58952880d22e5aa9c5ce5bd7e65fb8317fdc97cf2514f27333a +size 199058786 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..516117c05344fb409dc584861758e1cddc559cde --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15b02ef8c5a10db94dd17b99363e2f4e61eb3265bd47c2fec74fd216a1586069 +size 199058786 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bb9fa3fba4d002883a19df8f74080514f98a28c7 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f70121bc008747d949de46b3ed54e8990e816e1dae4d9ff8727108269a796f3 +size 199058722 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b0f18e16e943681a5ce8c197e1cd8d20ad3b7fae --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b44e8d66d148ccf50462e3476e7c9bfebf852f8ad57dd76ced06cd39027a67a3 +size 199058722 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2dd12e06c92a43f3884eff8569ed41291f7d4de4 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:453ad2aa3ac3bcf247d8a2dd7a95322217877295bfb7cdde17584d88b669f144 +size 199058658 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bbc4e902494b47049766ee22b484534b45158286 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1cdc9aaad6635f5b8d9667d7f76a43e19f3a18a00214337ae0702a237be2e5d1 +size 199058658 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..20e2978fca20f6cfd4c67683331e8540042b3532 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7cf52a38a43c27644b0de8fc30b8fbf684ea8d4057d2973e9bc4c3af83389987 +size 199058658 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5921c6646fb20770188732de682bb3f3d44d05df --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e77e8290f598e8137eacd77fb3b1255668a63661aa03c98d7437e11d055f7540 +size 199058658 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8efe97fb5ad69be0beafb22fb1b52e85be353098 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a45501a3017b2060f6f943a4df070666adb0443390bafd2e517ec2a452dff8a +size 199058647 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f11de2ee085d9658e6bdd1c282c6d83cd94c3645 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:332f79ee2f2247245544cfd01d7a97d77673058251d803b3df9bedbfad6dd82b +size 199058647 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a722924b3e3824038a9df1ef51b4ae0fa8c9c22b --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac98280f4e266d0d3a5a1ee1aa6f1ab946f94f56bdf6d60829dd54d96687e9c6 +size 199058850 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7885c346a4c48176f3826063268a664dc4b6dab5 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83d0e7e4f085de591683238df6095fb1714e4427c82202343a38c401aa57f1e5 +size 199058850 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..28f6771c8c6e5486d6b68ba3c8b31238da4a0dd0 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8cb3fdf9f44ab97a89d88f5862f34c7029766d5748e3641eff932092788334ab +size 199058722 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..11c7528dcfe878222498741a930554ac0b869014 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:934bfc718549067b89ff239ccfd1eced7dd0d75b5a746ae42048e46af4beb58c +size 199058722 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e0dee6cca55d9ec71192a046f1e9b4c9b16e5101 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:063d97f4e15e6b68a4f4280fbfbad7edfd43afaeaceb565dc66c0d029cfcb683 +size 199058658 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..18b6b158e3ddbcd70e90f213b37b6242220c7efd --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9acd927b377d5851870d3ea6e5259036d589da471750a5575d46630eef9b4f5a +size 199058658 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b7e750cfb7ac2274934770318920708d75e01c1 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70433c2f1c2f1eaf9109cb7a217e90fa5c50d44ec3968d30fbb3f8256c979467 +size 199058786 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e99462341cddbf15e1fe782b3a62487b40dd409f --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f31713dbceb960723bbdb4734ae92c0763e0a7a295ee0abc1cb9dfceefa1f4eb +size 199058786 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8835c3c514bfbd88d44b441efacceadf825b4156 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31556c364d1bd94c78262df769b707700b0bbf16ac1520eb1d00eccb81d66ba4 +size 199058722 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1586e276c1a482615c2e4f1dce93af72caba949f --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:540c2ae36c4771aa68a8efe37cf221a20f30b33fdea81f30bc59c70f70fb62a4 +size 199058722 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f441f9a196846740dd7b11d3ec64b4e5de29b4e6 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3c9882f91828161c3c7d4c63ee45e832bd0bfa8b03cdb64bac30953304cf6a4 +size 199058722 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bfa516f3ef38c99bc0d0736237b30cdaf9b5c96d --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c623a0660972f7958fdaf28971ff14523af4a87104e36a28c572fbd37c8b938a +size 199058722 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f96ad7e5e4fd387915b437713def447931119d8f --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:361052c429e12dc4f259fea709eb186d4ad192141c89685308cdfdd12ffa35ef +size 199058722 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9d0fe15b01abfd4acba88bd64acc6b1097b85935 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56ba9ad049bd63d291d3bb5d3d25653973c0aaab4df28281c55c26ca1eb3b90b +size 199058722 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c5f9f5b89b583c177f99f89caa1d1e3b51f1b75 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f10757c6af0e602d938c0ce43d60852d98f53535804ba5fb58379933a39ecf7d +size 199058786 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..734966419dc42ac46a13da17cbfe93cf0cd036db --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5e69cc6eefcf6572bca5415fae8e14675cce506805be9dc8275538defacebd9 +size 199058786 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..735cdac855935c30ad2ef2adda943499c9788c59 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1dab256021c543a791f87c015435fbdedcefd141bdbd31cc64cab49056e15cbd +size 199058658 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..261615756105ea4830e47986209ea08d8ca56546 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ecf0377fa35d0e135ef0b75c26d051b6089ac3d6cb6c0be550b04c9eb561e783 +size 199058658 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b2c128f6f5fd6e603a9fee647f9686c95f851d6d --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1623eeaa4653e9a383e9c6cf9ea37306e08f0cf9bfee914747b20e6cf60b8e1f +size 199058658 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a2f2596c2fa0f7b87536cd81cec4b712e2ba5f50 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36a94df20f93f55a4bdfa3991e92c1e07738d9a9f83eafddf531a336898e8eb2 +size 199058658 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d3b257793155246b94dd0f3605ea0bcff1ebf23 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95d220ded0de3397414f7c22b5ad98ff6a86188ac6d8bfa4ff120239311e49f5 +size 199058839 diff --git a/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f14cd0352903c31433552e1f40e4dc7a4bff85b --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6d68c9fe1321097b41af482101e00720effe1e540a8dfff780e45912f75b757 +size 199058839 diff --git a/4b284b84bc4seed4/global_step80108/layer_01-model_00-model_states.pt b/4b284b84bc4seed4/global_step80108/layer_01-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb6469d9180e0c2efb1e7eed3b241726f68939e0 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/layer_01-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:191c0bf6260795d2cfe5c25e233e87539c918445b0c99e9a590abdb13f69f0d6 +size 167511299 diff --git a/4b284b84bc4seed4/global_step80108/layer_01-model_01-model_states.pt b/4b284b84bc4seed4/global_step80108/layer_01-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..286ac340e25fbeaaf74731b092951649d3083deb --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/layer_01-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b80dd1ff52c794b43ec1113977930d991b9eb75aaf487ae9179c94e491b2815 +size 167511299 diff --git a/4b284b84bc4seed4/global_step80108/layer_03-model_00-model_states.pt b/4b284b84bc4seed4/global_step80108/layer_03-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..18e76cb372ff5ac6ccea0c400faa2bec4434b259 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/layer_03-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:117e67601aa7418eb0bbb8feab3bfb497358fee4825de256f3c7c9e5d8d9b6f9 +size 113308931 diff --git a/4b284b84bc4seed4/global_step80108/layer_03-model_01-model_states.pt b/4b284b84bc4seed4/global_step80108/layer_03-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..30a01d0b6d948e2e704643b77584043af5ee4976 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/layer_03-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b891f06b2717e15dee81d838af78227990a605b4c3f75c995967920bb1232dd +size 113308931 diff --git a/4b284b84bc4seed4/global_step80108/layer_04-model_00-model_states.pt b/4b284b84bc4seed4/global_step80108/layer_04-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a61909780f9a6fad5b76591e29125389c023ca8 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/layer_04-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50f9a28b4a0236ab09e6ad9f9b6ab6c8260eaa956ce00daac176f09a55a11579 +size 113308931 diff --git a/4b284b84bc4seed4/global_step80108/layer_04-model_01-model_states.pt b/4b284b84bc4seed4/global_step80108/layer_04-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5df4c5c432968edebe2b24d04bd497e3a1487ca4 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/layer_04-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12763434388b929ec1128e8539e8ec916762ba040404ad229005973874e14a65 +size 113308931 diff --git a/4b284b84bc4seed4/global_step80108/layer_05-model_00-model_states.pt b/4b284b84bc4seed4/global_step80108/layer_05-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..80988147f10d0963de49768584840be4e3998a6a --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/layer_05-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81c14882d686610ed03fe4bfde1c5cc9fb2b1d9e7bdfaa392a38f855c2ded18f +size 113308931 diff --git a/4b284b84bc4seed4/global_step80108/layer_05-model_01-model_states.pt b/4b284b84bc4seed4/global_step80108/layer_05-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cfc4768bff2990fd1248123d22201e36196426fd --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/layer_05-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3589c1e5ed7bca599500496419316c754be0a2506196420f73d15064b6b6788a +size 113308931 diff --git a/4b284b84bc4seed4/global_step80108/layer_06-model_00-model_states.pt b/4b284b84bc4seed4/global_step80108/layer_06-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..81e64fe4c708b9ceb5ef29f9b01c78092bb64047 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/layer_06-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:909d9ae0cc074cc813da1d0bfdb94fb3c955ed1ed1f952a39d77b0227d16504f +size 113308931 diff --git a/4b284b84bc4seed4/global_step80108/layer_06-model_01-model_states.pt b/4b284b84bc4seed4/global_step80108/layer_06-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a23f1ea7a7162019d107dec112f900bb3726443a --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/layer_06-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed6d767beed0a670d9d56f6cb4523658f3cc0462f9b351e915889c1385bb8214 +size 113308931 diff --git a/4b284b84bc4seed4/global_step80108/layer_07-model_00-model_states.pt b/4b284b84bc4seed4/global_step80108/layer_07-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e72bc7b411e91d504f1d1c8b0d6c92fa972f6771 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/layer_07-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2c310f1aaef648f55061cb075bf188f650840a9eb472338940a9d5c2255604a +size 113308931 diff --git a/4b284b84bc4seed4/global_step80108/layer_07-model_01-model_states.pt b/4b284b84bc4seed4/global_step80108/layer_07-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..782711064de465711dc508ecb2cd24395a947c0a --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/layer_07-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d94959a073af0cc9f2498ca4e8533c240ff90887b7813bea08d2f31987b2a46 +size 113308931 diff --git a/4b284b84bc4seed4/global_step80108/layer_08-model_00-model_states.pt b/4b284b84bc4seed4/global_step80108/layer_08-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d53b6211e119fa1528e80a49fe785559e0559d95 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/layer_08-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18273960a21d52acbf685a1d632fd64c9792b41a7def9f65f32a51a6851178f2 +size 113308931 diff --git a/4b284b84bc4seed4/global_step80108/layer_08-model_01-model_states.pt b/4b284b84bc4seed4/global_step80108/layer_08-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c8e62cc4ee6b9c02264277a1c8427d634ee79d59 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/layer_08-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc231234965d4c171f01ef7ca685b69e8a009231989a1dde0142f2d1df74aaf2 +size 113308931 diff --git a/4b284b84bc4seed4/global_step80108/layer_09-model_00-model_states.pt b/4b284b84bc4seed4/global_step80108/layer_09-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa7a11c5fefc0c3cb434b590b176775d9917bc4f --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/layer_09-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:054cbeaf14683cd6a2eccd5c6ec06c08a144915330674c71d25f7e9415b0a803 +size 113308931 diff --git a/4b284b84bc4seed4/global_step80108/layer_09-model_01-model_states.pt b/4b284b84bc4seed4/global_step80108/layer_09-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3bab3a6be23400ae2709a6f6f94621d2610f619 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/layer_09-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c655fb383306aa77eca3a54250cac7a38808ee8d606bfec022a9561ca6fbfca3 +size 113308931 diff --git a/4b284b84bc4seed4/global_step80108/layer_10-model_00-model_states.pt b/4b284b84bc4seed4/global_step80108/layer_10-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..292ad6a03f3f51cab95dec78c96189bf8eb49e05 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/layer_10-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4331d5936c36e45d540ce479d68eeffa218df1f94a2ef5243811c34602b919a +size 113308931 diff --git a/4b284b84bc4seed4/global_step80108/layer_10-model_01-model_states.pt b/4b284b84bc4seed4/global_step80108/layer_10-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..546b384f26cd028fa540e672887e61b83db5532b --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/layer_10-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1ca47724f2fe49ab2b15881f3484925387336f9ae58ae607c4d560bfd7d383a +size 113308931 diff --git a/4b284b84bc4seed4/global_step80108/layer_11-model_00-model_states.pt b/4b284b84bc4seed4/global_step80108/layer_11-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..30d57fc26789257685336c9f5f408192e0f24c6c --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/layer_11-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b48035b12326fb1729fc491443eada915b81000814d9b81116eaefcd6589bee8 +size 113308931 diff --git a/4b284b84bc4seed4/global_step80108/layer_11-model_01-model_states.pt b/4b284b84bc4seed4/global_step80108/layer_11-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a25ed841a3152615d254c77ada487875795a40c8 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/layer_11-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:716912c1d31b85147de4408ddef5a07d2a0e2eccc7a4cbf07dd0378562285cb8 +size 113308931 diff --git a/4b284b84bc4seed4/global_step80108/layer_12-model_00-model_states.pt b/4b284b84bc4seed4/global_step80108/layer_12-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0ec51072338e6946b7d4c7d423c3a4d34104171 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/layer_12-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7daa99b8a4cd994fa31d8dc05526b65b8b1222fd5ae7948bb90ea5ec77ed6cba +size 113308931 diff --git a/4b284b84bc4seed4/global_step80108/layer_12-model_01-model_states.pt b/4b284b84bc4seed4/global_step80108/layer_12-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f9100f5d955f922ec9e5e111a7b932f6a6e6eaa --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/layer_12-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d89628d003866edf1cd8131531a176448d8f44bf2a2ff69547a0edfe0b73c4a +size 113308931 diff --git a/4b284b84bc4seed4/global_step80108/layer_13-model_00-model_states.pt b/4b284b84bc4seed4/global_step80108/layer_13-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..29d67fdd0540a463bcebac309facf9b17aec3913 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/layer_13-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dff0cf4c6a2f0edd4de870c955e1717d486d185fd097c1070d7f478b992487a9 +size 113308931 diff --git a/4b284b84bc4seed4/global_step80108/layer_13-model_01-model_states.pt b/4b284b84bc4seed4/global_step80108/layer_13-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a036f4f7df274dadb00f061e121e09f7e2d84a53 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/layer_13-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94f01846bd99af0557259cf9ff4b28709ffde8625c21f2894262c0990b958e05 +size 113308931 diff --git a/4b284b84bc4seed4/global_step80108/layer_14-model_00-model_states.pt b/4b284b84bc4seed4/global_step80108/layer_14-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..670a0b148ce9180d6d68b5997f83e7bdd2d8e26f --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/layer_14-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb0db31e4a5fee1677e5848a378050b2ffe06b7d65f7e126cce0707b0a3d9170 +size 113308931 diff --git a/4b284b84bc4seed4/global_step80108/layer_14-model_01-model_states.pt b/4b284b84bc4seed4/global_step80108/layer_14-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..371c4c50e4d10893b52b0c217b50cf8907e1b1cf --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/layer_14-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3310e989241b723d95c84ee75363b72fe81ea23f32aec23c6a77cde931c67f4c +size 113308931 diff --git a/4b284b84bc4seed4/global_step80108/layer_15-model_00-model_states.pt b/4b284b84bc4seed4/global_step80108/layer_15-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..68f6d3679d5c0d32c3a2daba80fb32e4895fa592 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/layer_15-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a7a6cbfea7f93dcd20053ebf3732300cc7f4a0e3ef8ccd989d29263c35e4c1b +size 113308931 diff --git a/4b284b84bc4seed4/global_step80108/layer_15-model_01-model_states.pt b/4b284b84bc4seed4/global_step80108/layer_15-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c5ac8eab47f2b41c7f7ee6dd0a56d7a83d69ecb --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/layer_15-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d146a7e5f470f576200439477c2236464812b559e8cf81ca38a21e0b7b1f22fc +size 113308931 diff --git a/4b284b84bc4seed4/global_step80108/layer_16-model_00-model_states.pt b/4b284b84bc4seed4/global_step80108/layer_16-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..268d87f182db5da8d9b98f3aac76ebc02fc36eaa --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/layer_16-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39a4a2391a15dd1a436f61f39858dd3f9e746011ff8af349a6979c15d4ef3081 +size 113308931 diff --git a/4b284b84bc4seed4/global_step80108/layer_16-model_01-model_states.pt b/4b284b84bc4seed4/global_step80108/layer_16-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..388fba4b154cf9c7fc27e88863f9bdbe6182b1a3 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/layer_16-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5d72e2f638f4cf0a680e9ddf10b83fde2d0f61f13a5bbd3e0587b25ccde5e76 +size 113308931 diff --git a/4b284b84bc4seed4/global_step80108/layer_17-model_00-model_states.pt b/4b284b84bc4seed4/global_step80108/layer_17-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e31bf9f1772f8208e7cfd6b07fdb293bc8ad077b --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/layer_17-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8deb8bcc3f344b094409792a3a9e6709002100b0d38cbf035e64018bceb4c9ac +size 113308931 diff --git a/4b284b84bc4seed4/global_step80108/layer_17-model_01-model_states.pt b/4b284b84bc4seed4/global_step80108/layer_17-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b4e38ac5dd0300cbe825055e273edd2ed74bc326 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/layer_17-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2cb878574dd6b9e8c2ab0e345fca4a5428a1fabe892b243baef105fcf2f11c5d +size 113308931 diff --git a/4b284b84bc4seed4/global_step80108/layer_18-model_00-model_states.pt b/4b284b84bc4seed4/global_step80108/layer_18-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..81a2f097aba5e6b31c98b1690a4f7cece3ef6d30 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/layer_18-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13a5070ce9bedd8fcea6748a9befd032ea15fc231ccd145878c03c76b49a1c70 +size 113308931 diff --git a/4b284b84bc4seed4/global_step80108/layer_18-model_01-model_states.pt b/4b284b84bc4seed4/global_step80108/layer_18-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dac919cad18509824892ca082f731dda0264681b --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/layer_18-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1507cbbe045d0e5ab9dc07ca674c47d4bdfc7886cd67ddf75c94665578360663 +size 113308931 diff --git a/4b284b84bc4seed4/global_step80108/layer_19-model_00-model_states.pt b/4b284b84bc4seed4/global_step80108/layer_19-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..091fde39102fe65634269fd11caa1f5378ff863a --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/layer_19-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5105a5fd61ff699617f1605773d5917bb0c87d411904fe1257b5648a901b7c3 +size 113308931 diff --git a/4b284b84bc4seed4/global_step80108/layer_19-model_01-model_states.pt b/4b284b84bc4seed4/global_step80108/layer_19-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd66fc9d50a3ca429001315c2f549f1dc528d37e --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/layer_19-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73b4c424143a93de12116bd71cc7b7ec548675f186f734a454cf92ca7e6fbcbe +size 113308931 diff --git a/4b284b84bc4seed4/global_step80108/layer_20-model_00-model_states.pt b/4b284b84bc4seed4/global_step80108/layer_20-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..df505a46f569ad03bb512a64c5c6d4b9a65f4ac0 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/layer_20-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46cbe45f30847d9ef1b174748554a56e5226c79a74c18573b69bd675a1a6c1c0 +size 113308931 diff --git a/4b284b84bc4seed4/global_step80108/layer_20-model_01-model_states.pt b/4b284b84bc4seed4/global_step80108/layer_20-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0516ccefab05bfd650e434e18cdb72338b1499c --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/layer_20-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91e8564faf00e5dd23435aefb40e44ee74e39a839b34ab805ed175f02b21ed2e +size 113308931 diff --git a/4b284b84bc4seed4/global_step80108/layer_21-model_00-model_states.pt b/4b284b84bc4seed4/global_step80108/layer_21-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..524332d444d96b1cc89e9bd6bae1742c372c1725 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/layer_21-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fdf3ed0121926dd1390346bb65baaf6e3c724fc61fea79eae7b021df12047751 +size 113308931 diff --git a/4b284b84bc4seed4/global_step80108/layer_21-model_01-model_states.pt b/4b284b84bc4seed4/global_step80108/layer_21-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..45bbafb8e06df95f63470d79a8d31e1f7a23d0a3 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/layer_21-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:418a4de9f7e06c72f3f3bf1df4fac67c9433facb63968c310bbac5d933c9ed44 +size 113308931 diff --git a/4b284b84bc4seed4/global_step80108/layer_22-model_00-model_states.pt b/4b284b84bc4seed4/global_step80108/layer_22-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..39f6186a10e3a585e4ec67083268df508f6f51d6 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/layer_22-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60bde0ce17262d9e5ea26b81196bb3efcee6902a9e08d5b85c439dd1b5f991a4 +size 113308931 diff --git a/4b284b84bc4seed4/global_step80108/layer_22-model_01-model_states.pt b/4b284b84bc4seed4/global_step80108/layer_22-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..41cefc9632dfd262a8a380caea73f5a170c8ae6b --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/layer_22-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:461929085afb2dab1b2086548df3abc62a0e3106c1a88ef54f8740697aaee812 +size 113308931 diff --git a/4b284b84bc4seed4/global_step80108/layer_23-model_00-model_states.pt b/4b284b84bc4seed4/global_step80108/layer_23-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8114fda6a31afa53eb744bb4db210d42bfd0cfeb --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/layer_23-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c272b69421c5d8b4c27dbf365b4f5925d9e5c9474dc3b689182d5b734df900a +size 113308931 diff --git a/4b284b84bc4seed4/global_step80108/layer_23-model_01-model_states.pt b/4b284b84bc4seed4/global_step80108/layer_23-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f9b72f240027bf1b089a718876d41b94552b51bc --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/layer_23-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17c1b183ee105d46fd2d15538bf01b7f4d9b8be8fad87ca701e4c33552131582 +size 113308931 diff --git a/4b284b84bc4seed4/global_step80108/layer_24-model_00-model_states.pt b/4b284b84bc4seed4/global_step80108/layer_24-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ccf20cdc985bb3b9b5f83ff5d648b72f5c821b1c --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/layer_24-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3050f4e60a2b19752261d78fc446ea87984d1cdc9b70fef66d496c4ecd342a33 +size 113308931 diff --git a/4b284b84bc4seed4/global_step80108/layer_24-model_01-model_states.pt b/4b284b84bc4seed4/global_step80108/layer_24-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2fc3d0125950296182d05fd346e95b58f0b4835d --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/layer_24-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b04c34569596a3312ef93ad509171a0b5f8c42b96c07f16a57d66c3a16445ce +size 113308931 diff --git a/4b284b84bc4seed4/global_step80108/layer_25-model_00-model_states.pt b/4b284b84bc4seed4/global_step80108/layer_25-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..106fdbd20b7c33d0199188c78b78a34af26579cd --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/layer_25-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68b44582c19bb3dfae1c9cdc530e4d22d6ab0f7a84f4d8764f2dd977a80dcdb9 +size 113308931 diff --git a/4b284b84bc4seed4/global_step80108/layer_25-model_01-model_states.pt b/4b284b84bc4seed4/global_step80108/layer_25-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..14afde5c97437b5f4b655747235ba0af3d40c72f --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/layer_25-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd6e996fdcb45a9b64c02a0bf1de22e68770ba9214f4bbf4bf20d3a0c05917d9 +size 113308931 diff --git a/4b284b84bc4seed4/global_step80108/layer_26-model_00-model_states.pt b/4b284b84bc4seed4/global_step80108/layer_26-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc77111fb0be07be77d32206c22fa3716e5ca709 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/layer_26-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16faa40915cd684bbece37848d94f5c0109ea059f109f0a39aa031fa075f0e2f +size 113308931 diff --git a/4b284b84bc4seed4/global_step80108/layer_26-model_01-model_states.pt b/4b284b84bc4seed4/global_step80108/layer_26-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..526d87e6225c6410b954626b0719fd042ea3ce4b --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/layer_26-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:409aa3c644ae6c2c7424547d6aeff7422884348a10b5d39a7b5f9a7fa237b3fd +size 113308931 diff --git a/4b284b84bc4seed4/global_step80108/layer_27-model_00-model_states.pt b/4b284b84bc4seed4/global_step80108/layer_27-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8857a8d7e6c35d61d1b4c864311a159a1459a4b2 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/layer_27-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:953dea356b93c2a0b7476ca1858b6a5b0d78b122e58bd3c657e1997ad82e9a9a +size 113308931 diff --git a/4b284b84bc4seed4/global_step80108/layer_27-model_01-model_states.pt b/4b284b84bc4seed4/global_step80108/layer_27-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e0d95e0d077b2984ce8c3212716ff701a6b590fe --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/layer_27-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8df81dc19defce2c86cc5d56c673ab1b6926d4f8ade2a681132a8a5cd2e0836d +size 113308931 diff --git a/4b284b84bc4seed4/global_step80108/layer_28-model_00-model_states.pt b/4b284b84bc4seed4/global_step80108/layer_28-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b271029c89cff56b5a0718df8f6645d59149360f --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/layer_28-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5aa74b151db86b2974ec0ad197fceddef57fed406f356e378faa6745d14ad138 +size 113308931 diff --git a/4b284b84bc4seed4/global_step80108/layer_28-model_01-model_states.pt b/4b284b84bc4seed4/global_step80108/layer_28-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6862a9e0b6e530dce8b16b2c1929401c2752f4df --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/layer_28-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:904fcd0f4993677beb49eef61f12572c550f96edbdfc9f9d2a0f149b9c3b22b3 +size 113308931 diff --git a/4b284b84bc4seed4/global_step80108/layer_29-model_00-model_states.pt b/4b284b84bc4seed4/global_step80108/layer_29-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..daac51cdd4865ab71f8917b0e1a956b97d2a0544 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/layer_29-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:908934ce0e16495c26dde2821871c58d04aeae811519da78087ec9323ba40ab4 +size 113308931 diff --git a/4b284b84bc4seed4/global_step80108/layer_29-model_01-model_states.pt b/4b284b84bc4seed4/global_step80108/layer_29-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..428dd252af7ee52eddefffd83338e257466733ff --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/layer_29-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ce45add434bb91e3ccf0f4a4624deb3cbf2a96be242c62ab6cb96cd5fd35dbe +size 113308931 diff --git a/4b284b84bc4seed4/global_step80108/layer_30-model_00-model_states.pt b/4b284b84bc4seed4/global_step80108/layer_30-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5fc7c441a9f53f0a7e3c06eb9fda27992e6ff8b6 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/layer_30-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e626106da0a17102888491441e8bf93e5729dff66529e2adcb907109017504f +size 113308931 diff --git a/4b284b84bc4seed4/global_step80108/layer_30-model_01-model_states.pt b/4b284b84bc4seed4/global_step80108/layer_30-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..18cf8faa52cd9423a319f619c8d5966087be5ec9 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/layer_30-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cdc0288b70ed0f92e720dec680aa78b56dbaa0ddb2659cb490389b725f4807ac +size 113308931 diff --git a/4b284b84bc4seed4/global_step80108/layer_31-model_00-model_states.pt b/4b284b84bc4seed4/global_step80108/layer_31-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b0f3dc3085b060794ecfb030c6282afafba8054b --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/layer_31-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4bb4041a88fd6ce3a57c22764f56e8db2b108db6be5e70ebbcd0dc5adaeb1e27 +size 113308931 diff --git a/4b284b84bc4seed4/global_step80108/layer_31-model_01-model_states.pt b/4b284b84bc4seed4/global_step80108/layer_31-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..709ace02022800b9ec35a24080d42bf9c2f968cc --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/layer_31-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:634f1449056dfee3e764608821c95a8c19b2964217b8efc58cfb2b1250f1abd7 +size 113308931 diff --git a/4b284b84bc4seed4/global_step80108/layer_32-model_00-model_states.pt b/4b284b84bc4seed4/global_step80108/layer_32-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a37993b69d92ef2742d04f1cd45dbb03cd2c114c --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/layer_32-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6a7e51d8ee981053eaa89c42ac0cde16eb1c6da3c796e190a928caee6dc37ae +size 113308931 diff --git a/4b284b84bc4seed4/global_step80108/layer_32-model_01-model_states.pt b/4b284b84bc4seed4/global_step80108/layer_32-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2b0384e482ef73c2c7ebce48e692e7bf214e4901 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/layer_32-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0303d9e0546161557c06b70f7b78b750b3feb708cbce324b8084a232fa7b2aec +size 113308931 diff --git a/4b284b84bc4seed4/global_step80108/layer_33-model_00-model_states.pt b/4b284b84bc4seed4/global_step80108/layer_33-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d1486554663953343148205a20e3dceefb3dcee --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/layer_33-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a4917a8b0ac6fbffc8ecf59ce2e221de3e1346893c3e331e1c23c61c0f109cf +size 113308931 diff --git a/4b284b84bc4seed4/global_step80108/layer_33-model_01-model_states.pt b/4b284b84bc4seed4/global_step80108/layer_33-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..af32bb6651981e9082e6315edfd1c9229bf47e40 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/layer_33-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c736e1860e9452a68dc769d8cea47beb43cf02bbc483d0234382fb6b5583c63 +size 113308931 diff --git a/4b284b84bc4seed4/global_step80108/layer_34-model_00-model_states.pt b/4b284b84bc4seed4/global_step80108/layer_34-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c9bc627a8a6b0ab9c5c73d7564045a485c055ac --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/layer_34-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b186dc76e1b7bc0d0aa98f94ad3d0c7d675d3223e145a2263872aaa43ad4e80e +size 113308931 diff --git a/4b284b84bc4seed4/global_step80108/layer_34-model_01-model_states.pt b/4b284b84bc4seed4/global_step80108/layer_34-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ec4ad18caa23bf84b2db26cbf2124e309de86d4 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/layer_34-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8f9a436515bd106ef48e891ca76f5cde797c662a6ded9bbaedd70de1db4095c +size 113308931 diff --git a/4b284b84bc4seed4/global_step80108/layer_35-model_00-model_states.pt b/4b284b84bc4seed4/global_step80108/layer_35-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d4e4670119bcf51287679980ebd8558cdfdb55b1 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/layer_35-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7d18b697fc2d811762a77c53c4c162146c70ffb979cfff2f00af9ed959c3d10 +size 113308931 diff --git a/4b284b84bc4seed4/global_step80108/layer_35-model_01-model_states.pt b/4b284b84bc4seed4/global_step80108/layer_35-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ff4ea87f93706b5ba7da0fb243677eee2597f2ad --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/layer_35-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0baeb5d9252f7a6e6e60bbd377bd9934c681e09412efdb7a9210d1a140160a1f +size 113308931 diff --git a/4b284b84bc4seed4/global_step80108/layer_36-model_00-model_states.pt b/4b284b84bc4seed4/global_step80108/layer_36-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5bf74f0494a798828f07ea85faa0fbd60999f662 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/layer_36-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c219f3a6ee5b65a57707a9aae3d02d61a55882dbd46fba6ac89ada3eba117e92 +size 113308931 diff --git a/4b284b84bc4seed4/global_step80108/layer_36-model_01-model_states.pt b/4b284b84bc4seed4/global_step80108/layer_36-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..83e129595b93059e4c18454bb9f8d176d7cbc268 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/layer_36-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c8583aa8967f2e82d6a2d282e49e69537b0a2125b56b0e31ea88fac058c6a85 +size 113308931 diff --git a/4b284b84bc4seed4/global_step80108/layer_37-model_00-model_states.pt b/4b284b84bc4seed4/global_step80108/layer_37-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e55bc1611ffcce160b6443b15b44264f599f11d3 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/layer_37-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c10369200283598b95f5dcc249fae1e9b7a3ac3e1adaf8c631e50a0dee39a103 +size 113308931 diff --git a/4b284b84bc4seed4/global_step80108/layer_37-model_01-model_states.pt b/4b284b84bc4seed4/global_step80108/layer_37-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..29dccada14fa571fe7675ca64bd9dcfd79679bd9 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/layer_37-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f36325211e927219cd675e0560dac8c260c38ee2a3486fbbe19bd2c7bd7db9e +size 113308931 diff --git a/4b284b84bc4seed4/global_step80108/layer_38-model_00-model_states.pt b/4b284b84bc4seed4/global_step80108/layer_38-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa441a02e2560295a18e6ce8bc46e001ccb65d85 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/layer_38-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f0175cd7b455886ffa4b561a65ece005b8ed89f20e7254e9a09d2afe4252194 +size 113308931 diff --git a/4b284b84bc4seed4/global_step80108/layer_38-model_01-model_states.pt b/4b284b84bc4seed4/global_step80108/layer_38-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d05a1cdb357258de79d47013681defc40be5b38e --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/layer_38-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e10b5c54bfe99099fae6aa0631a5d10a36e0dad3c44e255566f600f1c1d7f5c +size 113308931 diff --git a/4b284b84bc4seed4/global_step80108/layer_40-model_00-model_states.pt b/4b284b84bc4seed4/global_step80108/layer_40-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8cc715f9e9f4cdc82f807cf4b39bb4147a1016aa --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/layer_40-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f29bdfd6cad29304b1376b42c0d06f4bf972ba6af60b43c6ce6ca41d3b76b71f +size 13507 diff --git a/4b284b84bc4seed4/global_step80108/layer_40-model_01-model_states.pt b/4b284b84bc4seed4/global_step80108/layer_40-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6f2086c6cf5f53342ef0d071b5a00f4cba6f09c --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/layer_40-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4f840959575575b01260ba5213fddcd02a98126859e926d9a7a82de68932338 +size 13507 diff --git a/4b284b84bc4seed4/global_step80108/mp_rank_00_model_states.pt b/4b284b84bc4seed4/global_step80108/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fef62ee195192c1ffbad07d6cc112b2614ca648f --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7fc8037c76ba30b6d5e6de4c7f0b92b82adfd83657492affd342911f6585a3f6 +size 51443 diff --git a/4b284b84bc4seed4/global_step80108/mp_rank_01_model_states.pt b/4b284b84bc4seed4/global_step80108/mp_rank_01_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ac3d9eab0e20e20133c8c0c35ff693d401cb3723 --- /dev/null +++ b/4b284b84bc4seed4/global_step80108/mp_rank_01_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b6c7c0fd1027c79b573543faada3628e9621e62593bb0d8aa3fe77f3b303c60 +size 51443 diff --git a/4b284b84bc4seed4/transformers/config.json b/4b284b84bc4seed4/transformers/config.json new file mode 100644 index 0000000000000000000000000000000000000000..df814c3a71ee49044410636b5eeb4f43611690ba --- /dev/null +++ b/4b284b84bc4seed4/transformers/config.json @@ -0,0 +1 @@ +{"vocab_size": 50432, "n_positions": 2048, "n_embd": 3072, "n_layer": 36, "n_head": 24, "n_inner": 12288, "activation_function": "gelu", "resid_pdrop": 0.1, "embd_pdrop": 0.1, "attn_pdrop": 0.1, "layer_norm_epsilon": 1e-05, "initializer_range": 0.02, "summary_type": "cls_index", "summary_use_proj": true, "summary_activation": null, "summary_first_dropout": 0.1, "summary_proj_to_labels": true, "scale_attn_weights": true, "use_cache": true, "scale_attn_by_inverse_layer_idx": false, "reorder_and_upcast_attn": false, "bos_token_id": 50256, "eos_token_id": 50256, "return_dict": true, "output_hidden_states": false, "output_attentions": false, "torchscript": false, "torch_dtype": null, "use_bfloat16": false, "tf_legacy_loss": false, "pruned_heads": {}, "tie_word_embeddings": true, "is_encoder_decoder": false, "is_decoder": false, "cross_attention_hidden_size": null, "add_cross_attention": false, "tie_encoder_decoder": false, "max_length": 20, "min_length": 0, "do_sample": false, "early_stopping": false, "num_beams": 1, "num_beam_groups": 1, "diversity_penalty": 0.0, "temperature": 1.0, "top_k": 50, "top_p": 1.0, "typical_p": 1.0, "repetition_penalty": 1.0, "length_penalty": 1.0, "no_repeat_ngram_size": 0, "encoder_no_repeat_ngram_size": 0, "bad_words_ids": null, "num_return_sequences": 1, "chunk_size_feed_forward": 0, "output_scores": false, "return_dict_in_generate": false, "forced_bos_token_id": null, "forced_eos_token_id": null, "remove_invalid_values": false, "exponential_decay_length_penalty": null, "suppress_tokens": null, "begin_suppress_tokens": null, "architectures": ["GPT2LMHeadModel"], "finetuning_task": null, "id2label": {"0": "LABEL_0", "1": "LABEL_1"}, "label2id": {"LABEL_0": 0, "LABEL_1": 1}, "tokenizer_class": null, "prefix": null, "pad_token_id": null, "sep_token_id": null, "decoder_start_token_id": null, "task_specific_params": null, "problem_type": null, "_name_or_path": "", "transformers_version": "4.25.0.dev0", "n_ctx": 1024, "gradient_checkpointing": false, "model_type": "gpt2"} \ No newline at end of file diff --git a/4b284b84bc4seed4/transformers/pytorch_model.bin b/4b284b84bc4seed4/transformers/pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..cdc073651656385e0b6cd62a6dca72759788761d --- /dev/null +++ b/4b284b84bc4seed4/transformers/pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:574d4eed830d74195847ac2f8e61b3cf8378080a00fd6ee9679b0f0e24c34e48 +size 8781203669 diff --git a/launch.sh b/launch.sh new file mode 100755 index 0000000000000000000000000000000000000000..6c3445845a5dae614feb4b8a1206322cd7bd9050 --- /dev/null +++ b/launch.sh @@ -0,0 +1,53 @@ +#!/bin/bash + +# Launch script using torch.distributed.run(). Used by slurm +# scripts, don't invoke directly. + +# Samuel's fix for apparent error in SLURM initialization +if [ $SLURM_LOCALID -eq 0 ]; then + rm -rf /dev/shm/* + rocm-smi || true +else + sleep 2 +fi + +export NCCL_SOCKET_IFNAME=hsn0,hsn1,hsn2,hsn3 +export OMP_NUM_THREADS=$SLURM_CPUS_PER_TASK +export FI_CXI_DEFAULT_CQ_SIZE=131072 + +# debugging (noisy) +#export NCCL_DEBUG=INFO +#export RCCL_KERNEL_COLL_TRACE_ENABLE=1 +#export NCCL_DEBUG_SUBSYS=INIT,COLL + +module --quiet purge +module load cray-python + +module load CrayEnv +module load PrgEnv-cray/8.3.3 +module load craype-accel-amd-gfx90a +module load cray-python + +module use /pfs/lustrep2/projappl/project_462000125/samantao-public/mymodules +module load suse-repo-deps/sam-default +module load rocm/sam-5.2.3.lua +module load rccl/sam-develop.lua +module load aws-ofi-rccl/sam-default.lua + +source venv/bin/activate + +MASTER_NODE=$(scontrol show hostnames "$SLURM_JOB_NODELIST" | head -n 1) +MASTER_PORT=9999 + +echo "Launching on $SLURMD_NODENAME ($SLURM_PROCID/$SLURM_JOB_NUM_NODES)," \ + "master $MASTER_NODE port $MASTER_PORT," \ + "GPUs $SLURM_GPUS_ON_NODE," \ + "CUDA: $(python -c 'import torch; print(torch.cuda.is_available())')" + +python -u -m torch.distributed.run \ + --nnodes $SLURM_JOB_NUM_NODES \ + --nproc_per_node $SLURM_GPUS_ON_NODE \ + --node_rank=$SLURM_PROCID \ + --master_addr $MASTER_NODE \ + --master_port $MASTER_PORT \ + "$@" diff --git a/sbatch_4b284b84bc4seed1.sh b/sbatch_4b284b84bc4seed1.sh new file mode 100644 index 0000000000000000000000000000000000000000..39022f3f6a3b0bf6d6b32152386dc474fede981c --- /dev/null +++ b/sbatch_4b284b84bc4seed1.sh @@ -0,0 +1,164 @@ +#!/bin/bash +#SBATCH --exclude=nid007571,nid007112,nid006774,nid007502,nid007506,nid007507,nid005145,nid006692,nid007218,nid007123,nid006124,nid006123,nid007496,nid007237,nid006852,nid007206,nid006947,nid007212,nid006977,nid007222,nid005444,nid007219,nid007493,nid007221,nid005300,nid005619,nid006118,nid005203,nid006113,nid006481,nid007077,nid005208,nid005207,nid005879,nid005901 +#SBATCH --nodes=32 +#SBATCH --ntasks-per-node=1 +#SBATCH --cpus-per-task=40 +#SBATCH --mem=256G +#SBATCH -p standard-g +#SBATCH -t 48:00:00 +#SBATCH --gpus-per-node=mi250:8 +#SBATCH --exclusive=user +#SBATCH --hint=nomultithread +#SBATCH --account=project_462000119 +#SBATCH -o logs/%j.out +#SBATCH -e logs/%j.err + +VARIANT=4b284b84bc4seed1 + +# if run without sbatch, invoke here +if [ -z $SLURM_JOB_ID ]; then + mkdir -p logs + sbatch "$0" + exit +fi + +set -euo pipefail + +# symlink logs/latest.out and logs/latest.err +ln -f -s $SLURM_JOB_ID.out logs/latest.out +ln -f -s $SLURM_JOB_ID.err logs/latest.err + +KILL_SWITCH_PATH=kill-switch-$VARIANT +CHECKPOINT_PATH=checkpoints_$VARIANT +TENSORBOARD_PATH=tensorboard_$VARIANT + +# Data +VOCAB_FILE="gpt2/vocab.json" +MERGE_FILE="gpt2/merges.txt" + +TRAIN_DATA_PATH=train.txt +# "train: 1.0 0:1 /scratch/project_462000119/data/c4/gpt2tok_c4_text_document" +VALID_DATA_PATH=val.txt +# "validation: 1.0 0:1 /scratch/project_462000119/data/c4_validation/gpt2tok_c4validation_rerun_text_document" + +PP_SIZE=1 +TP_SIZE=2 + +MICRO_BATCH_SIZE=2 +GRADIENT_ACCUMULATION_STEPS=1 +WORLD_SIZE=$((SLURM_GPUS_ON_NODE*SLURM_JOB_NUM_NODES)) +GLOBAL_BATCH_SIZE=$((MICRO_BATCH_SIZE*WORLD_SIZE*GRADIENT_ACCUMULATION_STEPS)) + +# Model parameters +source model_params.sh +MODEL_PARAM=("${PARAM_4516M[@]}") +NHIDDEN=${MODEL_PARAM[0]} +FFN_HIDDEN_SIZE=${MODEL_PARAM[1]} +KV_SIZE=${MODEL_PARAM[2]} +NHEADS=${MODEL_PARAM[3]} +NLAYERS=${MODEL_PARAM[4]} +SEQ_LEN=2048 + +echo "Model parameters: d_model $NHIDDEN ffw_size $FFN_HIDDEN_SIZE kv_size $KV_SIZE n_heads $NHEADS n_layers $NLAYERS" + +SAVE_INTERVAL=10000 + +# Tokens: 84_000_000_000 +# -> Samples: 41_015_625.0 +TRAIN_SAMPLES=41_015_625 + +OPTIMIZER_ARGS=" \ + --optimizer adam \ + --adam-beta1 0.9 \ + --adam-beta2 0.95 \ + --adam-eps 1e-8 \ + --lr 2e-4 \ + --min-lr 2e-5 \ + --lr-decay-style cosine \ + --lr-decay-samples $TRAIN_SAMPLES \ + --lr-warmup-samples 410_156 \ + --clip-grad 1.0 \ + --weight-decay 1e-1 \ + " + +GPT_ARGS=" \ + --num-layers $NLAYERS \ + --hidden-size $NHIDDEN \ + --num-attention-heads $NHEADS \ + --kv-channels $KV_SIZE \ + --ffn-hidden-size $FFN_HIDDEN_SIZE \ + --seq-length $SEQ_LEN \ + --max-position-embeddings $SEQ_LEN \ + --micro-batch-size $MICRO_BATCH_SIZE \ + --global-batch-size $GLOBAL_BATCH_SIZE \ + --train-samples $TRAIN_SAMPLES \ + --vocab-file $VOCAB_FILE \ + --merge-file $MERGE_FILE \ + --clip-grad 1.0 \ + --kill-switch-path $KILL_SWITCH_PATH \ + --bf16 \ + $OPTIMIZER_ARGS \ + " + +OUTPUT_ARGS=" \ + --log-interval 10 \ + --save-interval $SAVE_INTERVAL \ + --eval-interval 1000 \ + --eval-iters 100 \ + --tensorboard-dir $TENSORBOARD_PATH \ + --tensorboard-queue-size 5 \ + --log-timers-to-tensorboard \ + --log-batch-size-to-tensorboard \ + --log-validation-ppl-to-tensorboard \ + " + +ZERO_STAGE=0 + +mkdir -p ds_configs +DS_CONFIG_PATH="ds_configs/$SLURM_JOB_ID.json" + +cat < $DS_CONFIG_PATH +{ + "train_micro_batch_size_per_gpu": $MICRO_BATCH_SIZE, + "train_batch_size": $GLOBAL_BATCH_SIZE, + "gradient_clipping": 1.0, + "zero_optimization": { + "stage": $ZERO_STAGE + }, + "bf16": { + "enabled": true + }, + "steps_per_print": 2000, + "wall_clock_breakdown": false +} +EOF + +DEEPSPEED_ARGS=" \ + --deepspeed \ + --deepspeed_config $DS_CONFIG_PATH \ + --zero-stage $ZERO_STAGE \ + " + +CMD=" \ + Megatron-DeepSpeed/pretrain_gpt.py \ + --tensor-model-parallel-size $TP_SIZE \ + --pipeline-model-parallel-size $PP_SIZE \ + $GPT_ARGS \ + $OUTPUT_ARGS \ + --save $CHECKPOINT_PATH \ + --load $CHECKPOINT_PATH \ + --train-weighted-split-paths-path $TRAIN_DATA_PATH \ + --valid-weighted-split-paths-path $VALID_DATA_PATH \ + --data-impl mmap \ + --seed 1 \ + $DEEPSPEED_ARGS \ + " + +echo $CMD + +echo "START $SLURM_JOBID: $(date)" + +# bash launch_srun.sh $CMD +srun --label launch.sh $CMD + +echo "END $SLURM_JOBID: $(date)" diff --git a/sbatch_4b284b84bc4seed2.sh b/sbatch_4b284b84bc4seed2.sh new file mode 100644 index 0000000000000000000000000000000000000000..e4eb3c72f986fcd6386db53acad0db43a3fcfcaf --- /dev/null +++ b/sbatch_4b284b84bc4seed2.sh @@ -0,0 +1,164 @@ +#!/bin/bash +#SBATCH --exclude=nid007571,nid007112,nid006774,nid007502,nid007506,nid007507,nid005145,nid006692,nid007218,nid007123,nid006124,nid006123,nid007496,nid007237,nid006852,nid007206,nid006947,nid007212,nid006977,nid007222,nid005444,nid007219,nid007493,nid007221,nid005300,nid005619,nid006118,nid005203,nid006113,nid006481,nid007077,nid005208,nid005207,nid005879,nid005901 +#SBATCH --nodes=32 +#SBATCH --ntasks-per-node=1 +#SBATCH --cpus-per-task=40 +#SBATCH --mem=256G +#SBATCH -p standard-g +#SBATCH -t 48:00:00 +#SBATCH --gpus-per-node=mi250:8 +#SBATCH --exclusive=user +#SBATCH --hint=nomultithread +#SBATCH --account=project_462000119 +#SBATCH -o logs/%j.out +#SBATCH -e logs/%j.err + +VARIANT=4b284b84bc4seed2 + +# if run without sbatch, invoke here +if [ -z $SLURM_JOB_ID ]; then + mkdir -p logs + sbatch "$0" + exit +fi + +set -euo pipefail + +# symlink logs/latest.out and logs/latest.err +ln -f -s $SLURM_JOB_ID.out logs/latest.out +ln -f -s $SLURM_JOB_ID.err logs/latest.err + +KILL_SWITCH_PATH=kill-switch-$VARIANT +CHECKPOINT_PATH=checkpoints_$VARIANT +TENSORBOARD_PATH=tensorboard_$VARIANT + +# Data +VOCAB_FILE="gpt2/vocab.json" +MERGE_FILE="gpt2/merges.txt" + +TRAIN_DATA_PATH=train.txt +# "train: 1.0 0:1 /scratch/project_462000119/data/c4/gpt2tok_c4_text_document" +VALID_DATA_PATH=val.txt +# "validation: 1.0 0:1 /scratch/project_462000119/data/c4_validation/gpt2tok_c4validation_rerun_text_document" + +PP_SIZE=1 +TP_SIZE=2 + +MICRO_BATCH_SIZE=2 +GRADIENT_ACCUMULATION_STEPS=1 +WORLD_SIZE=$((SLURM_GPUS_ON_NODE*SLURM_JOB_NUM_NODES)) +GLOBAL_BATCH_SIZE=$((MICRO_BATCH_SIZE*WORLD_SIZE*GRADIENT_ACCUMULATION_STEPS)) + +# Model parameters +source model_params.sh +MODEL_PARAM=("${PARAM_4516M[@]}") +NHIDDEN=${MODEL_PARAM[0]} +FFN_HIDDEN_SIZE=${MODEL_PARAM[1]} +KV_SIZE=${MODEL_PARAM[2]} +NHEADS=${MODEL_PARAM[3]} +NLAYERS=${MODEL_PARAM[4]} +SEQ_LEN=2048 + +echo "Model parameters: d_model $NHIDDEN ffw_size $FFN_HIDDEN_SIZE kv_size $KV_SIZE n_heads $NHEADS n_layers $NLAYERS" + +SAVE_INTERVAL=10000 + +# Tokens: 84_000_000_000 +# -> Samples: 41_015_625.0 +TRAIN_SAMPLES=41_015_625 + +OPTIMIZER_ARGS=" \ + --optimizer adam \ + --adam-beta1 0.9 \ + --adam-beta2 0.95 \ + --adam-eps 1e-8 \ + --lr 2e-4 \ + --min-lr 2e-5 \ + --lr-decay-style cosine \ + --lr-decay-samples $TRAIN_SAMPLES \ + --lr-warmup-samples 410_156 \ + --clip-grad 1.0 \ + --weight-decay 1e-1 \ + " + +GPT_ARGS=" \ + --num-layers $NLAYERS \ + --hidden-size $NHIDDEN \ + --num-attention-heads $NHEADS \ + --kv-channels $KV_SIZE \ + --ffn-hidden-size $FFN_HIDDEN_SIZE \ + --seq-length $SEQ_LEN \ + --max-position-embeddings $SEQ_LEN \ + --micro-batch-size $MICRO_BATCH_SIZE \ + --global-batch-size $GLOBAL_BATCH_SIZE \ + --train-samples $TRAIN_SAMPLES \ + --vocab-file $VOCAB_FILE \ + --merge-file $MERGE_FILE \ + --clip-grad 1.0 \ + --kill-switch-path $KILL_SWITCH_PATH \ + --bf16 \ + $OPTIMIZER_ARGS \ + " + +OUTPUT_ARGS=" \ + --log-interval 10 \ + --save-interval $SAVE_INTERVAL \ + --eval-interval 1000 \ + --eval-iters 100 \ + --tensorboard-dir $TENSORBOARD_PATH \ + --tensorboard-queue-size 5 \ + --log-timers-to-tensorboard \ + --log-batch-size-to-tensorboard \ + --log-validation-ppl-to-tensorboard \ + " + +ZERO_STAGE=0 + +mkdir -p ds_configs +DS_CONFIG_PATH="ds_configs/$SLURM_JOB_ID.json" + +cat < $DS_CONFIG_PATH +{ + "train_micro_batch_size_per_gpu": $MICRO_BATCH_SIZE, + "train_batch_size": $GLOBAL_BATCH_SIZE, + "gradient_clipping": 1.0, + "zero_optimization": { + "stage": $ZERO_STAGE + }, + "bf16": { + "enabled": true + }, + "steps_per_print": 2000, + "wall_clock_breakdown": false +} +EOF + +DEEPSPEED_ARGS=" \ + --deepspeed \ + --deepspeed_config $DS_CONFIG_PATH \ + --zero-stage $ZERO_STAGE \ + " + +CMD=" \ + Megatron-DeepSpeed/pretrain_gpt.py \ + --tensor-model-parallel-size $TP_SIZE \ + --pipeline-model-parallel-size $PP_SIZE \ + $GPT_ARGS \ + $OUTPUT_ARGS \ + --save $CHECKPOINT_PATH \ + --load $CHECKPOINT_PATH \ + --train-weighted-split-paths-path $TRAIN_DATA_PATH \ + --valid-weighted-split-paths-path $VALID_DATA_PATH \ + --data-impl mmap \ + --seed 2 \ + $DEEPSPEED_ARGS \ + " + +echo $CMD + +echo "START $SLURM_JOBID: $(date)" + +# bash launch_srun.sh $CMD +srun --label launch.sh $CMD + +echo "END $SLURM_JOBID: $(date)" diff --git a/sbatch_4b284b84bc4seed3.sh b/sbatch_4b284b84bc4seed3.sh new file mode 100644 index 0000000000000000000000000000000000000000..d371158da1cd500cecdc768b23ec89ebafc92147 --- /dev/null +++ b/sbatch_4b284b84bc4seed3.sh @@ -0,0 +1,164 @@ +#!/bin/bash +#SBATCH --exclude=nid007571,nid007112,nid006774,nid007502,nid007506,nid007507,nid005145,nid006692,nid007218,nid007123,nid006124,nid006123,nid007496,nid007237,nid006852,nid007206,nid006947,nid007212,nid006977,nid007222,nid005444,nid007219,nid007493,nid007221,nid005300,nid005619,nid006118,nid005203,nid006113,nid006481,nid007077,nid005208,nid005207,nid005879,nid005901 +#SBATCH --nodes=32 +#SBATCH --ntasks-per-node=1 +#SBATCH --cpus-per-task=40 +#SBATCH --mem=256G +#SBATCH -p standard-g +#SBATCH -t 48:00:00 +#SBATCH --gpus-per-node=mi250:8 +#SBATCH --exclusive=user +#SBATCH --hint=nomultithread +#SBATCH --account=project_462000119 +#SBATCH -o logs/%j.out +#SBATCH -e logs/%j.err + +VARIANT=4b284b84bc4seed3 + +# if run without sbatch, invoke here +if [ -z $SLURM_JOB_ID ]; then + mkdir -p logs + sbatch "$0" + exit +fi + +set -euo pipefail + +# symlink logs/latest.out and logs/latest.err +ln -f -s $SLURM_JOB_ID.out logs/latest.out +ln -f -s $SLURM_JOB_ID.err logs/latest.err + +KILL_SWITCH_PATH=kill-switch-$VARIANT +CHECKPOINT_PATH=checkpoints_$VARIANT +TENSORBOARD_PATH=tensorboard_$VARIANT + +# Data +VOCAB_FILE="gpt2/vocab.json" +MERGE_FILE="gpt2/merges.txt" + +TRAIN_DATA_PATH=train.txt +# "train: 1.0 0:1 /scratch/project_462000119/data/c4/gpt2tok_c4_text_document" +VALID_DATA_PATH=val.txt +# "validation: 1.0 0:1 /scratch/project_462000119/data/c4_validation/gpt2tok_c4validation_rerun_text_document" + +PP_SIZE=1 +TP_SIZE=2 + +MICRO_BATCH_SIZE=2 +GRADIENT_ACCUMULATION_STEPS=1 +WORLD_SIZE=$((SLURM_GPUS_ON_NODE*SLURM_JOB_NUM_NODES)) +GLOBAL_BATCH_SIZE=$((MICRO_BATCH_SIZE*WORLD_SIZE*GRADIENT_ACCUMULATION_STEPS)) + +# Model parameters +source model_params.sh +MODEL_PARAM=("${PARAM_4516M[@]}") +NHIDDEN=${MODEL_PARAM[0]} +FFN_HIDDEN_SIZE=${MODEL_PARAM[1]} +KV_SIZE=${MODEL_PARAM[2]} +NHEADS=${MODEL_PARAM[3]} +NLAYERS=${MODEL_PARAM[4]} +SEQ_LEN=2048 + +echo "Model parameters: d_model $NHIDDEN ffw_size $FFN_HIDDEN_SIZE kv_size $KV_SIZE n_heads $NHEADS n_layers $NLAYERS" + +SAVE_INTERVAL=10000 + +# Tokens: 84_000_000_000 +# -> Samples: 41_015_625.0 +TRAIN_SAMPLES=41_015_625 + +OPTIMIZER_ARGS=" \ + --optimizer adam \ + --adam-beta1 0.9 \ + --adam-beta2 0.95 \ + --adam-eps 1e-8 \ + --lr 2e-4 \ + --min-lr 2e-5 \ + --lr-decay-style cosine \ + --lr-decay-samples $TRAIN_SAMPLES \ + --lr-warmup-samples 410_156 \ + --clip-grad 1.0 \ + --weight-decay 1e-1 \ + " + +GPT_ARGS=" \ + --num-layers $NLAYERS \ + --hidden-size $NHIDDEN \ + --num-attention-heads $NHEADS \ + --kv-channels $KV_SIZE \ + --ffn-hidden-size $FFN_HIDDEN_SIZE \ + --seq-length $SEQ_LEN \ + --max-position-embeddings $SEQ_LEN \ + --micro-batch-size $MICRO_BATCH_SIZE \ + --global-batch-size $GLOBAL_BATCH_SIZE \ + --train-samples $TRAIN_SAMPLES \ + --vocab-file $VOCAB_FILE \ + --merge-file $MERGE_FILE \ + --clip-grad 1.0 \ + --kill-switch-path $KILL_SWITCH_PATH \ + --bf16 \ + $OPTIMIZER_ARGS \ + " + +OUTPUT_ARGS=" \ + --log-interval 10 \ + --save-interval $SAVE_INTERVAL \ + --eval-interval 1000 \ + --eval-iters 100 \ + --tensorboard-dir $TENSORBOARD_PATH \ + --tensorboard-queue-size 5 \ + --log-timers-to-tensorboard \ + --log-batch-size-to-tensorboard \ + --log-validation-ppl-to-tensorboard \ + " + +ZERO_STAGE=0 + +mkdir -p ds_configs +DS_CONFIG_PATH="ds_configs/$SLURM_JOB_ID.json" + +cat < $DS_CONFIG_PATH +{ + "train_micro_batch_size_per_gpu": $MICRO_BATCH_SIZE, + "train_batch_size": $GLOBAL_BATCH_SIZE, + "gradient_clipping": 1.0, + "zero_optimization": { + "stage": $ZERO_STAGE + }, + "bf16": { + "enabled": true + }, + "steps_per_print": 2000, + "wall_clock_breakdown": false +} +EOF + +DEEPSPEED_ARGS=" \ + --deepspeed \ + --deepspeed_config $DS_CONFIG_PATH \ + --zero-stage $ZERO_STAGE \ + " + +CMD=" \ + Megatron-DeepSpeed/pretrain_gpt.py \ + --tensor-model-parallel-size $TP_SIZE \ + --pipeline-model-parallel-size $PP_SIZE \ + $GPT_ARGS \ + $OUTPUT_ARGS \ + --save $CHECKPOINT_PATH \ + --load $CHECKPOINT_PATH \ + --train-weighted-split-paths-path $TRAIN_DATA_PATH \ + --valid-weighted-split-paths-path $VALID_DATA_PATH \ + --data-impl mmap \ + --seed 3 \ + $DEEPSPEED_ARGS \ + " + +echo $CMD + +echo "START $SLURM_JOBID: $(date)" + +# bash launch_srun.sh $CMD +srun --label launch.sh $CMD + +echo "END $SLURM_JOBID: $(date)" diff --git a/sbatch_4b284b84bc4seed4.sh b/sbatch_4b284b84bc4seed4.sh new file mode 100644 index 0000000000000000000000000000000000000000..35841e20c5d96decf1bb29dc2e4fd80a3fd8e916 --- /dev/null +++ b/sbatch_4b284b84bc4seed4.sh @@ -0,0 +1,164 @@ +#!/bin/bash +#SBATCH --exclude=nid007571,nid007112,nid006774,nid007502,nid007506,nid007507,nid005145,nid006692,nid007218,nid007123,nid006124,nid006123,nid007496,nid007237,nid006852,nid007206,nid006947,nid007212,nid006977,nid007222,nid005444,nid007219,nid007493,nid007221,nid005300,nid005619,nid006118,nid005203,nid006113,nid006481,nid007077,nid005208,nid005207,nid005879,nid005901 +#SBATCH --nodes=32 +#SBATCH --ntasks-per-node=1 +#SBATCH --cpus-per-task=40 +#SBATCH --mem=256G +#SBATCH -p standard-g +#SBATCH -t 48:00:00 +#SBATCH --gpus-per-node=mi250:8 +#SBATCH --exclusive=user +#SBATCH --hint=nomultithread +#SBATCH --account=project_462000119 +#SBATCH -o logs/%j.out +#SBATCH -e logs/%j.err + +VARIANT=4b284b84bc4seed4 + +# if run without sbatch, invoke here +if [ -z $SLURM_JOB_ID ]; then + mkdir -p logs + sbatch "$0" + exit +fi + +set -euo pipefail + +# symlink logs/latest.out and logs/latest.err +ln -f -s $SLURM_JOB_ID.out logs/latest.out +ln -f -s $SLURM_JOB_ID.err logs/latest.err + +KILL_SWITCH_PATH=kill-switch-$VARIANT +CHECKPOINT_PATH=checkpoints_$VARIANT +TENSORBOARD_PATH=tensorboard_$VARIANT + +# Data +VOCAB_FILE="gpt2/vocab.json" +MERGE_FILE="gpt2/merges.txt" + +TRAIN_DATA_PATH=train.txt +# "train: 1.0 0:1 /scratch/project_462000119/data/c4/gpt2tok_c4_text_document" +VALID_DATA_PATH=val.txt +# "validation: 1.0 0:1 /scratch/project_462000119/data/c4_validation/gpt2tok_c4validation_rerun_text_document" + +PP_SIZE=1 +TP_SIZE=2 + +MICRO_BATCH_SIZE=2 +GRADIENT_ACCUMULATION_STEPS=1 +WORLD_SIZE=$((SLURM_GPUS_ON_NODE*SLURM_JOB_NUM_NODES)) +GLOBAL_BATCH_SIZE=$((MICRO_BATCH_SIZE*WORLD_SIZE*GRADIENT_ACCUMULATION_STEPS)) + +# Model parameters +source model_params.sh +MODEL_PARAM=("${PARAM_4516M[@]}") +NHIDDEN=${MODEL_PARAM[0]} +FFN_HIDDEN_SIZE=${MODEL_PARAM[1]} +KV_SIZE=${MODEL_PARAM[2]} +NHEADS=${MODEL_PARAM[3]} +NLAYERS=${MODEL_PARAM[4]} +SEQ_LEN=2048 + +echo "Model parameters: d_model $NHIDDEN ffw_size $FFN_HIDDEN_SIZE kv_size $KV_SIZE n_heads $NHEADS n_layers $NLAYERS" + +SAVE_INTERVAL=10000 + +# Tokens: 84_000_000_000 +# -> Samples: 41_015_625.0 +TRAIN_SAMPLES=41_015_625 + +OPTIMIZER_ARGS=" \ + --optimizer adam \ + --adam-beta1 0.9 \ + --adam-beta2 0.95 \ + --adam-eps 1e-8 \ + --lr 2e-4 \ + --min-lr 2e-5 \ + --lr-decay-style cosine \ + --lr-decay-samples $TRAIN_SAMPLES \ + --lr-warmup-samples 410_156 \ + --clip-grad 1.0 \ + --weight-decay 1e-1 \ + " + +GPT_ARGS=" \ + --num-layers $NLAYERS \ + --hidden-size $NHIDDEN \ + --num-attention-heads $NHEADS \ + --kv-channels $KV_SIZE \ + --ffn-hidden-size $FFN_HIDDEN_SIZE \ + --seq-length $SEQ_LEN \ + --max-position-embeddings $SEQ_LEN \ + --micro-batch-size $MICRO_BATCH_SIZE \ + --global-batch-size $GLOBAL_BATCH_SIZE \ + --train-samples $TRAIN_SAMPLES \ + --vocab-file $VOCAB_FILE \ + --merge-file $MERGE_FILE \ + --clip-grad 1.0 \ + --kill-switch-path $KILL_SWITCH_PATH \ + --bf16 \ + $OPTIMIZER_ARGS \ + " + +OUTPUT_ARGS=" \ + --log-interval 10 \ + --save-interval $SAVE_INTERVAL \ + --eval-interval 1000 \ + --eval-iters 100 \ + --tensorboard-dir $TENSORBOARD_PATH \ + --tensorboard-queue-size 5 \ + --log-timers-to-tensorboard \ + --log-batch-size-to-tensorboard \ + --log-validation-ppl-to-tensorboard \ + " + +ZERO_STAGE=0 + +mkdir -p ds_configs +DS_CONFIG_PATH="ds_configs/$SLURM_JOB_ID.json" + +cat < $DS_CONFIG_PATH +{ + "train_micro_batch_size_per_gpu": $MICRO_BATCH_SIZE, + "train_batch_size": $GLOBAL_BATCH_SIZE, + "gradient_clipping": 1.0, + "zero_optimization": { + "stage": $ZERO_STAGE + }, + "bf16": { + "enabled": true + }, + "steps_per_print": 2000, + "wall_clock_breakdown": false +} +EOF + +DEEPSPEED_ARGS=" \ + --deepspeed \ + --deepspeed_config $DS_CONFIG_PATH \ + --zero-stage $ZERO_STAGE \ + " + +CMD=" \ + Megatron-DeepSpeed/pretrain_gpt.py \ + --tensor-model-parallel-size $TP_SIZE \ + --pipeline-model-parallel-size $PP_SIZE \ + $GPT_ARGS \ + $OUTPUT_ARGS \ + --save $CHECKPOINT_PATH \ + --load $CHECKPOINT_PATH \ + --train-weighted-split-paths-path $TRAIN_DATA_PATH \ + --valid-weighted-split-paths-path $VALID_DATA_PATH \ + --data-impl mmap \ + --seed 4 \ + $DEEPSPEED_ARGS \ + " + +echo $CMD + +echo "START $SLURM_JOBID: $(date)" + +# bash launch_srun.sh $CMD +srun --label launch.sh $CMD + +echo "END $SLURM_JOBID: $(date)" diff --git a/tensorboard/tensorboard_4b284b84bc4seed1/events.out.tfevents.1674658724.nid007239.26287.0 b/tensorboard/tensorboard_4b284b84bc4seed1/events.out.tfevents.1674658724.nid007239.26287.0 new file mode 100644 index 0000000000000000000000000000000000000000..b03975b7a978ac8cf9672846188ba7ab3c53eb7f --- /dev/null +++ b/tensorboard/tensorboard_4b284b84bc4seed1/events.out.tfevents.1674658724.nid007239.26287.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9d86952b6bd9b66e9045f14c31b0830628ff01b5280790625cf457657ad1eb8 +size 91495950 diff --git a/tensorboard/tensorboard_4b284b84bc4seed1/events.out.tfevents.1674831652.nid005137.1007.0 b/tensorboard/tensorboard_4b284b84bc4seed1/events.out.tfevents.1674831652.nid005137.1007.0 new file mode 100644 index 0000000000000000000000000000000000000000..04fbf97142f335f33a503a203c78d4b6f523aa9d --- /dev/null +++ b/tensorboard/tensorboard_4b284b84bc4seed1/events.out.tfevents.1674831652.nid005137.1007.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f61c2a714fd0d4e8e938c42d43e0bc994cf623acdbe977ffc37588383fdb306b +size 54127334 diff --git a/tensorboard/tensorboard_4b284b84bc4seed1/events.out.tfevents.1674917202.nid005381.81963.0 b/tensorboard/tensorboard_4b284b84bc4seed1/events.out.tfevents.1674917202.nid005381.81963.0 new file mode 100644 index 0000000000000000000000000000000000000000..aa8cc01b6f7e1232bd239e2c1756921b597d0528 --- /dev/null +++ b/tensorboard/tensorboard_4b284b84bc4seed1/events.out.tfevents.1674917202.nid005381.81963.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3a7dbd43f6cce93c7a13e1bf9a69c4e2c866cf9745933ef9f89ff8a5112017a +size 40 diff --git a/tensorboard/tensorboard_4b284b84bc4seed1/events.out.tfevents.1674919168.nid005381.100825.0 b/tensorboard/tensorboard_4b284b84bc4seed1/events.out.tfevents.1674919168.nid005381.100825.0 new file mode 100644 index 0000000000000000000000000000000000000000..183b372aab47973d010db9c5a5780461aea1b142 --- /dev/null +++ b/tensorboard/tensorboard_4b284b84bc4seed1/events.out.tfevents.1674919168.nid005381.100825.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a46928e25109972d2dda9686ebb977f1daf56a30c3b9ae0dfc77e297ab794b3 +size 40 diff --git a/tensorboard/tensorboard_4b284b84bc4seed1/events.out.tfevents.1674921113.nid005381.117540.0 b/tensorboard/tensorboard_4b284b84bc4seed1/events.out.tfevents.1674921113.nid005381.117540.0 new file mode 100644 index 0000000000000000000000000000000000000000..845be08b4de00201ce6a207192ee1bbebb3265d6 --- /dev/null +++ b/tensorboard/tensorboard_4b284b84bc4seed1/events.out.tfevents.1674921113.nid005381.117540.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b63fd4458523f1f773d2f55774fa31623cf7430b9543bfa2385b6f85b243e759 +size 40 diff --git a/tensorboard/tensorboard_4b284b84bc4seed1/events.out.tfevents.1674923054.nid005381.3574.0 b/tensorboard/tensorboard_4b284b84bc4seed1/events.out.tfevents.1674923054.nid005381.3574.0 new file mode 100644 index 0000000000000000000000000000000000000000..339f6f5518d38e9264683f1237fdfe100692d4f4 --- /dev/null +++ b/tensorboard/tensorboard_4b284b84bc4seed1/events.out.tfevents.1674923054.nid005381.3574.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78665e4eea073089cf01cfa3cef04d042260aab75288a88376b60c13f3e1e019 +size 40 diff --git a/tensorboard/tensorboard_4b284b84bc4seed1/events.out.tfevents.1674925012.nid005381.20606.0 b/tensorboard/tensorboard_4b284b84bc4seed1/events.out.tfevents.1674925012.nid005381.20606.0 new file mode 100644 index 0000000000000000000000000000000000000000..ab1201700cf5f423dbc38e9b09a3aab9a0748aed --- /dev/null +++ b/tensorboard/tensorboard_4b284b84bc4seed1/events.out.tfevents.1674925012.nid005381.20606.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4bb75b30de22a532036e8ec272b42b92984b603b321d531963c10c9c4c6a5529 +size 40 diff --git a/tensorboard/tensorboard_4b284b84bc4seed1/events.out.tfevents.1674926965.nid005381.36913.0 b/tensorboard/tensorboard_4b284b84bc4seed1/events.out.tfevents.1674926965.nid005381.36913.0 new file mode 100644 index 0000000000000000000000000000000000000000..d847cb24d06e9eaad8630f2f1aeb99703119f66c --- /dev/null +++ b/tensorboard/tensorboard_4b284b84bc4seed1/events.out.tfevents.1674926965.nid005381.36913.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38f018dc9b6721cd1c97633be51edd98180a1868120699bca1b9b71cbb2f61ad +size 40 diff --git a/tensorboard/tensorboard_4b284b84bc4seed1/events.out.tfevents.1674928881.nid005381.53540.0 b/tensorboard/tensorboard_4b284b84bc4seed1/events.out.tfevents.1674928881.nid005381.53540.0 new file mode 100644 index 0000000000000000000000000000000000000000..d7327f1b9b9becdc0e5454626f1ab17a20ba47a4 --- /dev/null +++ b/tensorboard/tensorboard_4b284b84bc4seed1/events.out.tfevents.1674928881.nid005381.53540.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b37c27adc61acf84459451d2d64cf2973d2b8384b63a0dec12ebf5da045e4be0 +size 40 diff --git a/tensorboard/tensorboard_4b284b84bc4seed2/events.out.tfevents.1674658764.nid006937.11253.0 b/tensorboard/tensorboard_4b284b84bc4seed2/events.out.tfevents.1674658764.nid006937.11253.0 new file mode 100644 index 0000000000000000000000000000000000000000..8e4b735e652856513bd6e79e4a57c86ca350cebe --- /dev/null +++ b/tensorboard/tensorboard_4b284b84bc4seed2/events.out.tfevents.1674658764.nid006937.11253.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:782bfb2f3bfd38cb15051eedb2bfa098db9331c1cbb95f71a607406ee2d68133 +size 92490539 diff --git a/tensorboard/tensorboard_4b284b84bc4seed2/events.out.tfevents.1674831652.nid005727.105506.0 b/tensorboard/tensorboard_4b284b84bc4seed2/events.out.tfevents.1674831652.nid005727.105506.0 new file mode 100644 index 0000000000000000000000000000000000000000..e6c78aa1f8e00341eb92fddb48be2585d9b42237 --- /dev/null +++ b/tensorboard/tensorboard_4b284b84bc4seed2/events.out.tfevents.1674831652.nid005727.105506.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4fbfea9b4912d8210859f8ee97e6be4274f45c68add106bf138a7152fcd9e29c +size 54127334 diff --git a/tensorboard/tensorboard_4b284b84bc4seed2/events.out.tfevents.1674917202.nid006075.61654.0 b/tensorboard/tensorboard_4b284b84bc4seed2/events.out.tfevents.1674917202.nid006075.61654.0 new file mode 100644 index 0000000000000000000000000000000000000000..18ab581769ee08cc0867082e3db06399afaf5a28 --- /dev/null +++ b/tensorboard/tensorboard_4b284b84bc4seed2/events.out.tfevents.1674917202.nid006075.61654.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e557d21c54385dde64932607180a513684e499a03606aaec9cd7879e21b154d5 +size 40 diff --git a/tensorboard/tensorboard_4b284b84bc4seed2/events.out.tfevents.1674917801.nid006075.69973.0 b/tensorboard/tensorboard_4b284b84bc4seed2/events.out.tfevents.1674917801.nid006075.69973.0 new file mode 100644 index 0000000000000000000000000000000000000000..390e6ef61b709b4dd02ece2f27700e2a196150d2 --- /dev/null +++ b/tensorboard/tensorboard_4b284b84bc4seed2/events.out.tfevents.1674917801.nid006075.69973.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cadf338418540a3766280edb2b6227253d1de4bacd044694ab1675f12131b75c +size 16424 diff --git a/tensorboard/tensorboard_4b284b84bc4seed2/events.out.tfevents.1674918036.nid006075.75226.0 b/tensorboard/tensorboard_4b284b84bc4seed2/events.out.tfevents.1674918036.nid006075.75226.0 new file mode 100644 index 0000000000000000000000000000000000000000..230f8ecb1a8849c0e3bbd2e27154394682e94e2b --- /dev/null +++ b/tensorboard/tensorboard_4b284b84bc4seed2/events.out.tfevents.1674918036.nid006075.75226.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d63faeddfbf58f240698c74f3ca15f9bd8b81779bfd5e02cd14c3a5a269903de +size 16424 diff --git a/tensorboard/tensorboard_4b284b84bc4seed2/events.out.tfevents.1674918303.nid006075.82930.0 b/tensorboard/tensorboard_4b284b84bc4seed2/events.out.tfevents.1674918303.nid006075.82930.0 new file mode 100644 index 0000000000000000000000000000000000000000..e02603133bd0be4639516beebbee8d50badcb6b7 --- /dev/null +++ b/tensorboard/tensorboard_4b284b84bc4seed2/events.out.tfevents.1674918303.nid006075.82930.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad2e61c2572614f14d37b0af825b39741fbba412f879642c9248f95ce71e7708 +size 16424 diff --git a/tensorboard/tensorboard_4b284b84bc4seed2/events.out.tfevents.1674918527.nid006075.88110.0 b/tensorboard/tensorboard_4b284b84bc4seed2/events.out.tfevents.1674918527.nid006075.88110.0 new file mode 100644 index 0000000000000000000000000000000000000000..6e489f59e2b6a26da5638046a8ac75df6cdd914d --- /dev/null +++ b/tensorboard/tensorboard_4b284b84bc4seed2/events.out.tfevents.1674918527.nid006075.88110.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d18083916420a216a7a3037f5ac5ccfa502110de02bb3f197e1ee9cd76fd9d5f +size 16424 diff --git a/tensorboard/tensorboard_4b284b84bc4seed2/events.out.tfevents.1674918717.nid006075.92841.0 b/tensorboard/tensorboard_4b284b84bc4seed2/events.out.tfevents.1674918717.nid006075.92841.0 new file mode 100644 index 0000000000000000000000000000000000000000..60ab114440d66782c02e00ec0440d164a19d9969 --- /dev/null +++ b/tensorboard/tensorboard_4b284b84bc4seed2/events.out.tfevents.1674918717.nid006075.92841.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36cbd272a17b0db192030c083ba2917d25472a599e6ca142bcbcfd76072ea610 +size 16424 diff --git a/tensorboard/tensorboard_4b284b84bc4seed3/events.out.tfevents.1674658903.nid007236.26010.0 b/tensorboard/tensorboard_4b284b84bc4seed3/events.out.tfevents.1674658903.nid007236.26010.0 new file mode 100644 index 0000000000000000000000000000000000000000..2e6ffaed79b6683796a6ccf655a61851b17b183a --- /dev/null +++ b/tensorboard/tensorboard_4b284b84bc4seed3/events.out.tfevents.1674658903.nid007236.26010.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58fb4e38f34503b1e9f13d8957bb01f1e82a099148bb434af602f7234db8c724 +size 93843615 diff --git a/tensorboard/tensorboard_4b284b84bc4seed3/events.out.tfevents.1674831691.nid006477.1824.0 b/tensorboard/tensorboard_4b284b84bc4seed3/events.out.tfevents.1674831691.nid006477.1824.0 new file mode 100644 index 0000000000000000000000000000000000000000..452e36bb044a771945b529dd2c96e67c91d0979c --- /dev/null +++ b/tensorboard/tensorboard_4b284b84bc4seed3/events.out.tfevents.1674831691.nid006477.1824.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f10c99e2f3191b05f83e1293ed60e043dadfea6f8b396c9ac672242f61c1239f +size 54127334 diff --git a/tensorboard/tensorboard_4b284b84bc4seed3/events.out.tfevents.1674918939.nid006075.98165.0 b/tensorboard/tensorboard_4b284b84bc4seed3/events.out.tfevents.1674918939.nid006075.98165.0 new file mode 100644 index 0000000000000000000000000000000000000000..37b483841f598279eb4fa245947618056470a947 --- /dev/null +++ b/tensorboard/tensorboard_4b284b84bc4seed3/events.out.tfevents.1674918939.nid006075.98165.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee320d3a4272b6069b6a5fb939bcbe016f711216c6d76976ce57a02cabef049b +size 16424 diff --git a/tensorboard/tensorboard_4b284b84bc4seed3/events.out.tfevents.1674919168.nid006075.105880.0 b/tensorboard/tensorboard_4b284b84bc4seed3/events.out.tfevents.1674919168.nid006075.105880.0 new file mode 100644 index 0000000000000000000000000000000000000000..b2c790492050df407cfa595247e4d2f487a000bf --- /dev/null +++ b/tensorboard/tensorboard_4b284b84bc4seed3/events.out.tfevents.1674919168.nid006075.105880.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c46ca9c83c87e7dcc8103e5d0abdd82d51370090ebd85704944e8f9bb664640 +size 16424 diff --git a/tensorboard/tensorboard_4b284b84bc4seed3/events.out.tfevents.1674919385.nid006075.110638.0 b/tensorboard/tensorboard_4b284b84bc4seed3/events.out.tfevents.1674919385.nid006075.110638.0 new file mode 100644 index 0000000000000000000000000000000000000000..30abb015c3d28c6c5285676a9ad0920e8e2ffa35 --- /dev/null +++ b/tensorboard/tensorboard_4b284b84bc4seed3/events.out.tfevents.1674919385.nid006075.110638.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:edd95bcf43b1cdc033fafbaf719e9c8ce8fb128ab570b711ca9fb3adaa53b37d +size 40 diff --git a/tensorboard/tensorboard_4b284b84bc4seed3/events.out.tfevents.1674919856.nid006075.116393.0 b/tensorboard/tensorboard_4b284b84bc4seed3/events.out.tfevents.1674919856.nid006075.116393.0 new file mode 100644 index 0000000000000000000000000000000000000000..4130d8b10167b80c45cdccdca63197fcf6afb83b --- /dev/null +++ b/tensorboard/tensorboard_4b284b84bc4seed3/events.out.tfevents.1674919856.nid006075.116393.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac9aaac51e131d9b7328835d5e5ad6322b0df9c1456095d391d7904dc200ee0e +size 16424 diff --git a/tensorboard/tensorboard_4b284b84bc4seed3/events.out.tfevents.1674920043.nid006075.124089.0 b/tensorboard/tensorboard_4b284b84bc4seed3/events.out.tfevents.1674920043.nid006075.124089.0 new file mode 100644 index 0000000000000000000000000000000000000000..5017355768488b99cb0257f69956a9bba40ca124 --- /dev/null +++ b/tensorboard/tensorboard_4b284b84bc4seed3/events.out.tfevents.1674920043.nid006075.124089.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1114a1251c41af9358453d820e2653403cd65f4adcacd144612be622345c92a5 +size 16424 diff --git a/tensorboard/tensorboard_4b284b84bc4seed3/events.out.tfevents.1674920233.nid006075.128804.0 b/tensorboard/tensorboard_4b284b84bc4seed3/events.out.tfevents.1674920233.nid006075.128804.0 new file mode 100644 index 0000000000000000000000000000000000000000..75c1fc6eb01a670548d0ad05d9f260b7ade58178 --- /dev/null +++ b/tensorboard/tensorboard_4b284b84bc4seed3/events.out.tfevents.1674920233.nid006075.128804.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03b8e78978f9be74bc8761c25719da9dff51a684cf1b4372b2bf09965928064d +size 16424 diff --git a/tensorboard/tensorboard_4b284b84bc4seed4/events.out.tfevents.1674658792.nid006915.36949.0 b/tensorboard/tensorboard_4b284b84bc4seed4/events.out.tfevents.1674658792.nid006915.36949.0 new file mode 100644 index 0000000000000000000000000000000000000000..770e7f60e5089bd4b13bdda0e62db98480e07f9a --- /dev/null +++ b/tensorboard/tensorboard_4b284b84bc4seed4/events.out.tfevents.1674658792.nid006915.36949.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f48f92df81f00397bdd5b37de3ea7e3d304fcde81ee650891e9ced34a5bb311e +size 83323638 diff --git a/tensorboard/tensorboard_4b284b84bc4seed4/events.out.tfevents.1674831652.nid006201.114021.0 b/tensorboard/tensorboard_4b284b84bc4seed4/events.out.tfevents.1674831652.nid006201.114021.0 new file mode 100644 index 0000000000000000000000000000000000000000..fe9c5e123936d012f2e47801f497e26741f55d95 --- /dev/null +++ b/tensorboard/tensorboard_4b284b84bc4seed4/events.out.tfevents.1674831652.nid006201.114021.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40fb6233f8db18908137ac3ee02072b9ec9520bf561ea060e725f5794730d52c +size 72098194 diff --git a/tensorboard/tensorboard_4b284b84bc4seed4/events.out.tfevents.1674948893.nid005588.30817.0 b/tensorboard/tensorboard_4b284b84bc4seed4/events.out.tfevents.1674948893.nid005588.30817.0 new file mode 100644 index 0000000000000000000000000000000000000000..7adf7f94214e5171d291f4e301674b3764830e6c --- /dev/null +++ b/tensorboard/tensorboard_4b284b84bc4seed4/events.out.tfevents.1674948893.nid005588.30817.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f3e6cf4e5124057edda8fcbd0d1a043325c103f7578904b72b1c7794028ff11 +size 16424 diff --git a/tensorboard/tensorboard_4b284b84bc4seed4/events.out.tfevents.1674949121.nid005588.36807.0 b/tensorboard/tensorboard_4b284b84bc4seed4/events.out.tfevents.1674949121.nid005588.36807.0 new file mode 100644 index 0000000000000000000000000000000000000000..d1b09ae0180aacdd72a5e97f608429572e5cf318 --- /dev/null +++ b/tensorboard/tensorboard_4b284b84bc4seed4/events.out.tfevents.1674949121.nid005588.36807.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78c24460cccb384894a4f48211f8fb9ad91bed060e3f6841e285b64a5d4bb36e +size 16424 diff --git a/tensorboard/tensorboard_4b284b84bc4seed4/events.out.tfevents.1674949320.nid005588.42425.0 b/tensorboard/tensorboard_4b284b84bc4seed4/events.out.tfevents.1674949320.nid005588.42425.0 new file mode 100644 index 0000000000000000000000000000000000000000..c861dea2a67eb258c62be1d334b2fd78c6394660 --- /dev/null +++ b/tensorboard/tensorboard_4b284b84bc4seed4/events.out.tfevents.1674949320.nid005588.42425.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ab58b189252c153985afd24cbc81081516270836da63275b2bb15b1af375bd4 +size 16424 diff --git a/tensorboard/tensorboard_4b284b84bc4seed4/events.out.tfevents.1674949467.nid005588.47434.0 b/tensorboard/tensorboard_4b284b84bc4seed4/events.out.tfevents.1674949467.nid005588.47434.0 new file mode 100644 index 0000000000000000000000000000000000000000..802a98b7c64bb0c30a262705b2feecfd5e25e530 --- /dev/null +++ b/tensorboard/tensorboard_4b284b84bc4seed4/events.out.tfevents.1674949467.nid005588.47434.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a15c1527585ccc7c50835d40f9db4c1c33bf797c09d571babe00a81dcafdafc +size 16424 diff --git a/tensorboard/tensorboard_4b284b84bc4seed4/events.out.tfevents.1674949636.nid005588.52938.0 b/tensorboard/tensorboard_4b284b84bc4seed4/events.out.tfevents.1674949636.nid005588.52938.0 new file mode 100644 index 0000000000000000000000000000000000000000..faf9a2529a091542b3f33977062e947335a87f66 --- /dev/null +++ b/tensorboard/tensorboard_4b284b84bc4seed4/events.out.tfevents.1674949636.nid005588.52938.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d3acd0d0de0f0e0fa5ef2d7337966b0d681c41561a0fec81683070666f90d59 +size 16424 diff --git a/tensorboard/tensorboard_4b284b84bc4seed4/events.out.tfevents.1674949805.nid005588.60510.0 b/tensorboard/tensorboard_4b284b84bc4seed4/events.out.tfevents.1674949805.nid005588.60510.0 new file mode 100644 index 0000000000000000000000000000000000000000..c6e64b7427a8483fe30226a0937a048cea93aa5e --- /dev/null +++ b/tensorboard/tensorboard_4b284b84bc4seed4/events.out.tfevents.1674949805.nid005588.60510.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:146d272cf3d26ae589369f4fee5f1ef579184bcf719eb930f786105738e8515c +size 16424