diff --git a/.gitattributes b/.gitattributes index c7d9f3332a950355d5a77d85000f05e6f45435ea..b35067910d48afec0ee4685e52415477e48d881f 100644 --- a/.gitattributes +++ b/.gitattributes @@ -32,3 +32,99 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text *.zip filter=lfs diff=lfs merge=lfs -text *.zst filter=lfs diff=lfs merge=lfs -text *tfevents* filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_GEM-web_nlg_en_PALM_prompt_2.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_GEM-wiki_lingua_en_tldr_en_3.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_gem_xsum_article_DOC_summary_3.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed3/evaluation/generation/examples.1b121b21bc4seed3_GEM-web_nlg_en_PALM_prompt_5.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed3/evaluation/generation/examples.1b121b21bc4seed3_GEM-wiki_lingua_en_tldr_en_0.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed3/evaluation/generation/examples.1b121b21bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed3/evaluation/generation/examples.1b121b21bc4seed3_gem_xsum_article_DOC_summary_0.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_GEM-web_nlg_en_PALM_prompt_5.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_GEM-wiki_lingua_en_tldr_en_0.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_gem_xsum_article_DOC_summary_4.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_gem_xsum_article_DOC_summary_5.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed3/evaluation/generation/examples.1b121b21bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_gem_xsum_article_DOC_summary_4.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_gem_xsum_article_DOC_summary_5.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_GEM-web_nlg_en_PALM_prompt_1.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_GEM-wiki_lingua_en_tldr_en_1.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_GEM-web_nlg_en_PALM_prompt_4.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_GEM-wiki_lingua_en_tldr_en_4.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_gem_xsum_article_DOC_summary_0.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed3/evaluation/generation/examples.1b121b21bc4seed3_gem_xsum_article_DOC_summary_3.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_GEM-web_nlg_en_PALM_prompt_4.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_GEM-wiki_lingua_en_tldr_en_4.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_gem_xsum_article_DOC_summary_3.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_GEM-web_nlg_en_PALM_prompt_1.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_GEM-wiki_lingua_en_tldr_en_1.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed3/evaluation/generation/examples.1b121b21bc4seed3_GEM-wiki_lingua_en_tldr_en_2.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_GEM-wiki_lingua_en_tldr_en_2.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_gem_xsum_article_DOC_summary_3.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed3/evaluation/generation/examples.1b121b21bc4seed3_gem_xsum_article_DOC_summary_4.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed3/evaluation/generation/examples.1b121b21bc4seed3_gem_xsum_article_DOC_summary_5.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_GEM-web_nlg_en_PALM_prompt_2.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_GEM-wiki_lingua_en_tldr_en_3.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_gem_xsum_article_DOC_summary_0.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_gem_xsum_article_DOC_summary_0.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_GEM-web_nlg_en_PALM_prompt_0.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_gem_xsum_article_DOC_summary_4.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_gem_xsum_article_DOC_summary_5.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed3/evaluation/generation/examples.1b121b21bc4seed3_GEM-web_nlg_en_PALM_prompt_3.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed3/evaluation/generation/examples.1b121b21bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_GEM-web_nlg_en_PALM_prompt_3.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_GEM-web_nlg_en_PALM_prompt_3.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_GEM-wiki_lingua_en_tldr_en_5.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed3/evaluation/generation/examples.1b121b21bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_GEM-web_nlg_en_PALM_prompt_5.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_GEM-wiki_lingua_en_tldr_en_0.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed3/evaluation/generation/examples.1b121b21bc4seed3_GEM-web_nlg_en_PALM_prompt_2.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed3/evaluation/generation/examples.1b121b21bc4seed3_GEM-wiki_lingua_en_tldr_en_3.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_GEM-web_nlg_en_PALM_prompt_2.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_GEM-wiki_lingua_en_tldr_en_3.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_GEM-wiki_lingua_en_tldr_en_2.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_gem_xsum_article_DOC_summary_1.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_gem_xsum_article_DOC_summary_2.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed3/evaluation/generation/examples.1b121b21bc4seed3_GEM-web_nlg_en_PALM_prompt_4.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed3/evaluation/generation/examples.1b121b21bc4seed3_GEM-wiki_lingua_en_tldr_en_4.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed3/evaluation/generation/examples.1b121b21bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_GEM-web_nlg_en_PALM_prompt_4.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_GEM-wiki_lingua_en_tldr_en_4.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_gem_xsum_article_DOC_summary_1.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_gem_xsum_article_DOC_summary_2.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_GEM-wiki_lingua_en_tldr_en_2.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed3/evaluation/generation/examples.1b121b21bc4seed3_GEM-web_nlg_en_PALM_prompt_1.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed3/evaluation/generation/examples.1b121b21bc4seed3_GEM-wiki_lingua_en_tldr_en_1.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed3/evaluation/generation/examples.1b121b21bc4seed3_gem_xsum_article_DOC_summary_1.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed3/evaluation/generation/examples.1b121b21bc4seed3_gem_xsum_article_DOC_summary_2.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_GEM-web_nlg_en_PALM_prompt_1.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_GEM-wiki_lingua_en_tldr_en_1.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_GEM-web_nlg_en_PALM_prompt_5.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_GEM-wiki_lingua_en_tldr_en_0.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_gem_xsum_article_DOC_summary_1.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_gem_xsum_article_DOC_summary_2.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_GEM-wiki_lingua_en_tldr_en_5.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_GEM-web_nlg_en_PALM_prompt_3.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed3/evaluation/generation/examples.1b121b21bc4seed3_GEM-web_nlg_en_PALM_prompt_0.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_GEM-web_nlg_en_PALM_prompt_0.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_GEM-web_nlg_en_PALM_prompt_0.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed3/evaluation/generation/examples.1b121b21bc4seed3_GEM-wiki_lingua_en_tldr_en_5.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed3/evaluation/generation/examples.1b121b21bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_GEM-wiki_lingua_en_tldr_en_5.jsonl filter=lfs diff=lfs merge=lfs -text +1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl filter=lfs diff=lfs merge=lfs -text diff --git a/1b121b21bc4seed1/evaluation/generation/agg.1b121b21bc4seed1_GEM-web_nlg_en_PALM_prompt_0.json b/1b121b21bc4seed1/evaluation/generation/agg.1b121b21bc4seed1_GEM-web_nlg_en_PALM_prompt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..03e0cc4018f1c72a215319cccee203b2f5f34e9e --- /dev/null +++ b/1b121b21bc4seed1/evaluation/generation/agg.1b121b21bc4seed1_GEM-web_nlg_en_PALM_prompt_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.31005545889675595, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.024221663303322493}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.06333959745402563, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0017129657332336005}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.2660634003689691, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004758664963766919}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.09455536275767198, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0020202782477753084}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.02992387161371905, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0010678757643085887}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.13162654248190145, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003224162069371238}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.045045993698642706, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0012585799900103791}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.061154332270835166, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0015925366548222631}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.26067769163704907, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004663300404214987}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.09174293269832776, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0018940760825308196}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.06064250474249417, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.001621939447674481}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.25579533250119046, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004509656638017682}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.0906091189082405, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.001901338184221523}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/1b121b21bc4seed1/evaluation/generation/agg.1b121b21bc4seed1_GEM-web_nlg_en_PALM_prompt_1.json b/1b121b21bc4seed1/evaluation/generation/agg.1b121b21bc4seed1_GEM-web_nlg_en_PALM_prompt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..c7a1e3e3250dd4569c9832b5a6d7b293be6220ea --- /dev/null +++ b/1b121b21bc4seed1/evaluation/generation/agg.1b121b21bc4seed1_GEM-web_nlg_en_PALM_prompt_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.3253498336709165, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.03212142507533847}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.060918256661001154, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.001387907396461889}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.3063168556661825, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005105195108996422}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.09469312150361009, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.001863178804950363}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.027316953543545387, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0008360022968447658}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.1391741163483647, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0032268292328296168}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.042453810034119334, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001154483862783651}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.05742537248926894, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0012621921122595368}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.2883872431662452, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004673161214630172}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.08927770465065916, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0016929550946172228}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.058015541222877484, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0013118024160571136}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.2900074000424914, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0046821199593389245}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.09008895599436548, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0017491206522219078}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/1b121b21bc4seed1/evaluation/generation/agg.1b121b21bc4seed1_GEM-web_nlg_en_PALM_prompt_2.json b/1b121b21bc4seed1/evaluation/generation/agg.1b121b21bc4seed1_GEM-web_nlg_en_PALM_prompt_2.json new file mode 100644 index 0000000000000000000000000000000000000000..9ba4ad9b38c62c9d4a84e5de77f53828394d2143 --- /dev/null +++ b/1b121b21bc4seed1/evaluation/generation/agg.1b121b21bc4seed1_GEM-web_nlg_en_PALM_prompt_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.31791276568975185, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.02727147856829631}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.05962717338634471, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.00126061681638203}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.30756287355829814, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004889305792734938}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.09336715846217024, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0016996772402870365}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.02670280090842877, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007604338404443195}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.14249676402659822, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0032896138546168476}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.04191645296449831, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0010709241966443265}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.05627058448383118, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0011470016078651416}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.2896458162973523, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0044554794302764}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.08815984465580837, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0015470326777333359}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.05706756866828331, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0012020871707703095}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.292251335959323, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004510651275741409}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.08926200923694406, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.001613762141288785}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/1b121b21bc4seed1/evaluation/generation/agg.1b121b21bc4seed1_GEM-web_nlg_en_PALM_prompt_3.json b/1b121b21bc4seed1/evaluation/generation/agg.1b121b21bc4seed1_GEM-web_nlg_en_PALM_prompt_3.json new file mode 100644 index 0000000000000000000000000000000000000000..51aeec59ceef2306cf559736dcf3e17be89c1766 --- /dev/null +++ b/1b121b21bc4seed1/evaluation/generation/agg.1b121b21bc4seed1_GEM-web_nlg_en_PALM_prompt_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.3212440432130126, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.02833396914504117}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.06018320328990788, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0012792421021156602}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.31701882107369783, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004918042604954739}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.09437325152413317, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0016293117647949373}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.02718506309171944, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.000834511570552857}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.14788498862069166, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0033325099175022747}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.042391214062896254, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0010316080252432995}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.05656198333950361, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0011649029158652883}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.2959773638751678, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004411378256218955}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.08870171226199733, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0014934510170629485}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.05732291421825896, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0012233313963698896}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.3008574516119203, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004550770798562808}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.0897987691484568, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0015399085797828443}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/1b121b21bc4seed1/evaluation/generation/agg.1b121b21bc4seed1_GEM-web_nlg_en_PALM_prompt_4.json b/1b121b21bc4seed1/evaluation/generation/agg.1b121b21bc4seed1_GEM-web_nlg_en_PALM_prompt_4.json new file mode 100644 index 0000000000000000000000000000000000000000..b39fedaf7271f205bea213abca5ce0cf14659299 --- /dev/null +++ b/1b121b21bc4seed1/evaluation/generation/agg.1b121b21bc4seed1_GEM-web_nlg_en_PALM_prompt_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.34701320585063394, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.012982772867681795}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.06139220025240579, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.001204641896215659}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.32370589082989293, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004818041311873955}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.09652792542278772, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0015764734075382092}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.027393636493786414, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007666521742975135}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.15165230865373422, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003290995473977093}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.043124737274736084, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0010143599611912326}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.057858738343212236, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0011371996173128948}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.3014171252596505, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004324422192213472}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.09083921184905662, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0014744271896824609}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.05856942284861244, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0011580171724704853}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.30659074236282113, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004443465919036145}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.09197412784787223, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0015015595131035856}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/1b121b21bc4seed1/evaluation/generation/agg.1b121b21bc4seed1_GEM-web_nlg_en_PALM_prompt_5.json b/1b121b21bc4seed1/evaluation/generation/agg.1b121b21bc4seed1_GEM-web_nlg_en_PALM_prompt_5.json new file mode 100644 index 0000000000000000000000000000000000000000..9c62905bbc183d94701ecea86e2ca435d4b60e76 --- /dev/null +++ b/1b121b21bc4seed1/evaluation/generation/agg.1b121b21bc4seed1_GEM-web_nlg_en_PALM_prompt_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.3826134137609412, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.027260987836796497}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.06210934649298242, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0011637172836219596}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.32987573012277627, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0048175275958975364}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.09769981149870674, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0015568330004171944}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.027334516755102147, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0006792346244010215}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.1540494964221242, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0033061515191188284}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.04331193468813116, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0009723654636517451}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.058131690562405976, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001071674347816923}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.30470149207947667, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004224186135139794}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.09131104015906616, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0014304797258199975}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.05908274659378142, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0011102880375707994}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.3110966005686351, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004419284614315986}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.09280326127954946, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0014767682135790052}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/1b121b21bc4seed1/evaluation/generation/agg.1b121b21bc4seed1_GEM-wiki_lingua_en_tldr_en_0.json b/1b121b21bc4seed1/evaluation/generation/agg.1b121b21bc4seed1_GEM-wiki_lingua_en_tldr_en_0.json new file mode 100644 index 0000000000000000000000000000000000000000..dc0b30725524b580e7da306ddb9a05751001ed25 --- /dev/null +++ b/1b121b21bc4seed1/evaluation/generation/agg.1b121b21bc4seed1_GEM-wiki_lingua_en_tldr_en_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.1444356353252771, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0018890228924276567}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.24333387644429813, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0026067622578618776}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.16854478548066482, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0018569277613818772}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.029280987606291494, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007237627275927142}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.05112009572683697, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.001337818306117227}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.034308638506432475, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0008125402811211317}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.11294853294767912, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0013180107899456023}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.19771034044326136, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002117097962875754}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.13358205180049998, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0013364507319559807}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.13255355115964793, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0017152326851252678}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.2246765687186434, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002420653997148166}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.1549132489748441, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016876295948321293}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 1.4836403082580132, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.04275891251756906}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/1b121b21bc4seed1/evaluation/generation/agg.1b121b21bc4seed1_GEM-wiki_lingua_en_tldr_en_1.json b/1b121b21bc4seed1/evaluation/generation/agg.1b121b21bc4seed1_GEM-wiki_lingua_en_tldr_en_1.json new file mode 100644 index 0000000000000000000000000000000000000000..e74fa9c18518741d45554d8576a085a23b7db0eb --- /dev/null +++ b/1b121b21bc4seed1/evaluation/generation/agg.1b121b21bc4seed1_GEM-wiki_lingua_en_tldr_en_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.14337611363324493, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0017975787265801645}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.2401884909277128, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002577850850716675}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.16619267944887964, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.001744164720654144}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.024778664535770947, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007555235233701629}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.04385427041760851, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0013655854605521512}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.028880049821475656, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0007891070933473794}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.10397637743893304, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001235246358495789}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.18006724988321413, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0019906559738365613}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.12166495381666467, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0011944014882187845}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.13419081390261864, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0016722655575097506}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.22568787667911147, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002430850770097226}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.15572261717667488, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016216939170534584}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 1.368798582263273, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.03762251064773447}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/1b121b21bc4seed1/evaluation/generation/agg.1b121b21bc4seed1_GEM-wiki_lingua_en_tldr_en_2.json b/1b121b21bc4seed1/evaluation/generation/agg.1b121b21bc4seed1_GEM-wiki_lingua_en_tldr_en_2.json new file mode 100644 index 0000000000000000000000000000000000000000..2dd1e7dfcd9f8bafed434f682161f3ad3b84e0c6 --- /dev/null +++ b/1b121b21bc4seed1/evaluation/generation/agg.1b121b21bc4seed1_GEM-wiki_lingua_en_tldr_en_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.15063044447280027, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.001940763130936743}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.23931115978829579, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0024971943832608266}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.17019067213369107, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0017690889374743603}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.029664097877505877, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0009118238978394307}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.04760945326052988, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.001306711433850517}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.033005228021297704, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0008241949468737384}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.11542835667429227, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0014439177169422246}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.18791535392357211, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.001981689065390633}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.131223027742424, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0012757407637194174}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.14098071498465764, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.001813064708734854}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.22467978591395918, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0023443476592751983}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.15936229418185377, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016407771888788867}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 1.5622860462600348, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.043740854824911794}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/1b121b21bc4seed1/evaluation/generation/agg.1b121b21bc4seed1_GEM-wiki_lingua_en_tldr_en_3.json b/1b121b21bc4seed1/evaluation/generation/agg.1b121b21bc4seed1_GEM-wiki_lingua_en_tldr_en_3.json new file mode 100644 index 0000000000000000000000000000000000000000..be1dd61c0cec8e23a9b2d30baccf76154202ec17 --- /dev/null +++ b/1b121b21bc4seed1/evaluation/generation/agg.1b121b21bc4seed1_GEM-wiki_lingua_en_tldr_en_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.13853097159476044, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0024033845722523724}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.2022241539975303, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002895744315329479}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.1459775119747986, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002013820231047812}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.027922753485106568, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0010069321667728792}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.041810329656802245, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.00129627924231701}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.02907493824937833, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0008064371846682719}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.10946213334283154, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0019316172770680437}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.1624038367425624, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0023444744969795006}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.11526184202559941, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0015132431316080114}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.1294243469444916, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0022694744228463435}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.18910016521383136, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0027080908132011243}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.1361503335550405, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.001865935511568599}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 1.5234316086072492, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.04994760816269213}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/1b121b21bc4seed1/evaluation/generation/agg.1b121b21bc4seed1_GEM-wiki_lingua_en_tldr_en_4.json b/1b121b21bc4seed1/evaluation/generation/agg.1b121b21bc4seed1_GEM-wiki_lingua_en_tldr_en_4.json new file mode 100644 index 0000000000000000000000000000000000000000..33397b2478c53374e44d67b02eb73fbe59bc6de1 --- /dev/null +++ b/1b121b21bc4seed1/evaluation/generation/agg.1b121b21bc4seed1_GEM-wiki_lingua_en_tldr_en_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.048283116115591836, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0018762804337576465}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.07012389259959088, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0024827186502375275}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.04937920113316496, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0017006423976957319}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.009647802697589025, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0006103768053178551}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.015261115214929618, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0009960688572823394}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.010104805168030258, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0005574344481643184}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.039482927106928814, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0015510440139044537}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.05812150365824274, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.00207507825756795}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.04024639157961486, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0013631991023636098}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.04495702046511921, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0017562417792707258}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.06533375820468378, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0023195859576008596}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.045827471133389246, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.001572714794925252}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 0.41252863907826776, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.030373767513404697}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/1b121b21bc4seed1/evaluation/generation/agg.1b121b21bc4seed1_GEM-wiki_lingua_en_tldr_en_5.json b/1b121b21bc4seed1/evaluation/generation/agg.1b121b21bc4seed1_GEM-wiki_lingua_en_tldr_en_5.json new file mode 100644 index 0000000000000000000000000000000000000000..508d6c33a39429710e1a6c151e520cafe736a546 --- /dev/null +++ b/1b121b21bc4seed1/evaluation/generation/agg.1b121b21bc4seed1_GEM-wiki_lingua_en_tldr_en_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.008053948401330599, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0008246264662235712}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.011572381851776472, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0011296167548172531}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.008092466035741461, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0007725180183102787}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.0016487162145299862, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.00028855076065369416}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.002359034970945986, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.00033523534751396603}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.0016583152317218213, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.00024030776163960353}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.006581900525062106, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0006767336687555497}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.009604072556401588, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0009440395007256133}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.006591147101382126, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0006203194340556792}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.007446672471389, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0007645726188902775}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.01074764632172318, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0010438920929096284}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.00747305417348784, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.000709782509687814}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 1.1512232954144342e-06, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 2.094932653320538e-06}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/1b121b21bc4seed1/evaluation/generation/agg.1b121b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_0.json b/1b121b21bc4seed1/evaluation/generation/agg.1b121b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..cf353e084b59e955fb84f2515344d6a527b5aab5 --- /dev/null +++ b/1b121b21bc4seed1/evaluation/generation/agg.1b121b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 0.7454534998692752, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.07804428323713496}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.06474609956563113, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002808015303613375}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.0348307362954131, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0014091894165256253}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.03918099607350703, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.001448534494550284}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.016683043975980968, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0014447318755830502}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.007670856047129852, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0005580500848436268}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.008523314750914139, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.00063055748185768}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.05551189449248439, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.00238259584939437}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.03040510241026872, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0012245380288356473}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.033916243277006014, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001231432823341605}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.054968825384225664, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0023305151110030124}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.02911562853755617, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0011623178626526266}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.033158173617653046, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0011976728573487477}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/1b121b21bc4seed1/evaluation/generation/agg.1b121b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_1.json b/1b121b21bc4seed1/evaluation/generation/agg.1b121b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_1.json new file mode 100644 index 0000000000000000000000000000000000000000..9404154ea7d6191dd4e9449a77bdba19652fe32e --- /dev/null +++ b/1b121b21bc4seed1/evaluation/generation/agg.1b121b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 5.487694889793941, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.07555119011558427}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.3097058053229197, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002851087946324211}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.43110365850951743, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002732778963977049}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.3321953827037549, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0020364301991294543}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.12287476036716052, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0016877708444218635}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.17280953287169348, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0019134667041499913}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.13126151027829455, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001411164906927139}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.22519107207919958, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002044768338085085}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.32069030400568344, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0022416724958190157}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.24346830553368265, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0014712983587429052}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.25598458046409817, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.002501331832178447}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.35721132057108596, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002561727405040063}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.2746466676619327, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0018777824275120166}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/1b121b21bc4seed1/evaluation/generation/agg.1b121b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_2.json b/1b121b21bc4seed1/evaluation/generation/agg.1b121b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_2.json new file mode 100644 index 0000000000000000000000000000000000000000..9bdd337aadfd56c516d76efa952a0df5a403e780 --- /dev/null +++ b/1b121b21bc4seed1/evaluation/generation/agg.1b121b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 6.079188977413186, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.09602875924306557}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.3181407194694957, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0029777295615160512}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4561708867688496, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0026452494137559723}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.346570361859306, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002052145530841731}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.13642028395369205, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0018950492351855646}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.19647624995791846, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0019636015048637256}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.14693316116112215, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0014445847251510187}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.2315672124269367, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002127274716028904}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3415431295705076, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0022584378328241905}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.25482744735128565, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0014755904280259592}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.2655109833740872, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.002636322289847473}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.38142593418332454, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002536630793778901}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.2890174556326334, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0018995638277943165}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/1b121b21bc4seed1/evaluation/generation/agg.1b121b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_3.json b/1b121b21bc4seed1/evaluation/generation/agg.1b121b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_3.json new file mode 100644 index 0000000000000000000000000000000000000000..9f6f0b8e5e55fbab9cca7426a3406a6cefe66eea --- /dev/null +++ b/1b121b21bc4seed1/evaluation/generation/agg.1b121b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 5.439720663780092, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.09057671754019295}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.33806886805387837, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0031451949821916397}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4597540434384101, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0025911053727046204}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.35966978129457794, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0020809245391192944}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.15002040777811748, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0019728388177885454}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.2046175785902067, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.001988761577155802}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.15787398183922485, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.00151813234143548}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.24363492051808863, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0021801249774331755}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3434646349475326, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.00230667877920879}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.26303596646553673, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001522516609384217}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.2803542384188989, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.002777229104092061}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3816738562894357, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0025233042461889513}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.2981457337030485, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.001964234489421683}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/1b121b21bc4seed1/evaluation/generation/agg.1b121b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_4.json b/1b121b21bc4seed1/evaluation/generation/agg.1b121b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_4.json new file mode 100644 index 0000000000000000000000000000000000000000..15f73a14edde93d855565b72d73c5ff5ba61c847 --- /dev/null +++ b/1b121b21bc4seed1/evaluation/generation/agg.1b121b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 3.9189279109719335, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.08586279820080885}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.39213707891049004, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.003422529928577996}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.44238533983355405, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0025751632202055024}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.3836182432795783, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0022054074783422308}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.17932569557247965, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0021875288020798776}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.2014446351152472, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.001986701156425044}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.17345256590048624, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001662967964824317}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.2822423599102126, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002501678088025689}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.32790464597969743, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0022994271661774903}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.27924589416548823, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0017055264106925416}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.3236183940771683, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0030448679972683726}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3650546853387208, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002486300924606491}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.31650257132624704, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002105427772389244}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/1b121b21bc4seed1/evaluation/generation/agg.1b121b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_5.json b/1b121b21bc4seed1/evaluation/generation/agg.1b121b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_5.json new file mode 100644 index 0000000000000000000000000000000000000000..7868610dc72f2952367a338897a3d6b1f737f05d --- /dev/null +++ b/1b121b21bc4seed1/evaluation/generation/agg.1b121b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 3.0686372723608897, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.06784266491877249}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.4502554374503682, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0033630982834692595}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.42945542013401933, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002595990607765447}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.4095857053929965, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0021530995714477558}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.20886191169135895, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0023179990401586887}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.1967893746603374, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.001931221479807446}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.18712397033462674, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0017078080439781192}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.32145296922919064, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0025789465971034213}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3125724382034645, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002290959462627688}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.29430723400568193, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001762954764782701}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.36887628081177687, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.00302325518602794}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3523561197227813, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002466960449053646}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.335707785812935, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0020851385129732505}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/1b121b21bc4seed1/evaluation/generation/agg.1b121b21bc4seed1_gem_xsum_article_DOC_summary_0.json b/1b121b21bc4seed1/evaluation/generation/agg.1b121b21bc4seed1_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..491c54a719c1e1bda50d1fe7ac2162e80d7680a8 --- /dev/null +++ b/1b121b21bc4seed1/evaluation/generation/agg.1b121b21bc4seed1_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.13656588620899038, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.00174226154738388}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.3323235396298205, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.003846536397189559}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.19123744824446468, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0022992268247988583}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.025701014397443208, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0008822864860028765}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.06451842393614433, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0022307575351008177}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.0362962242227074, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0012357989639325655}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.10175956050352102, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0012156226058548923}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.24958177981302834, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0028231998096754063}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.14272621341641745, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0016087589844111059}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.1074311808382226, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0014050024971339861}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.2636816826721476, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0032819789427964595}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.15074429962396632, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0018801101946759444}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.3841560907125259, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.07797827326949171}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/1b121b21bc4seed1/evaluation/generation/agg.1b121b21bc4seed1_gem_xsum_article_DOC_summary_1.json b/1b121b21bc4seed1/evaluation/generation/agg.1b121b21bc4seed1_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..b3912952b73304c14bd41881ee62d07aea8d44b9 --- /dev/null +++ b/1b121b21bc4seed1/evaluation/generation/agg.1b121b21bc4seed1_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.10551189065335231, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0015632545047201442}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.26396369315037715, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0036356422465613878}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.1490109968360671, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0021151321607124005}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.015258372576455077, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007194850115847547}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.0401042986262725, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0019569862879314013}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.021870860381131174, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0010335421346335594}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.08322301164562862, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0011487703143784498}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.20979036419712682, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0028033758287091875}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.11776037181510428, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0015663569819055773}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.08413103520980872, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.001254290848777802}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.21222983148038477, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.00304896385565602}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.11905956031628537, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0017138611513238453}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 0.7666050226687372, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.06474629405034218}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/1b121b21bc4seed1/evaluation/generation/agg.1b121b21bc4seed1_gem_xsum_article_DOC_summary_2.json b/1b121b21bc4seed1/evaluation/generation/agg.1b121b21bc4seed1_gem_xsum_article_DOC_summary_2.json new file mode 100644 index 0000000000000000000000000000000000000000..49193132a1e72cbe023ed4e66c3268dea4acc588 --- /dev/null +++ b/1b121b21bc4seed1/evaluation/generation/agg.1b121b21bc4seed1_gem_xsum_article_DOC_summary_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.10715846509597497, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0015697108273323291}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.2695418218368475, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0036206648240501645}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.15152826480726653, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002114221677973485}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.01667569031887618, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007375139406724271}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.043570635275517515, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0019441097483278629}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.023831872627776102, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001048493003352801}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.08504138318382073, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0011733846471463298}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.21610444539656637, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002873607280157199}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.12053707825720893, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0015925749869109209}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.0856088008772477, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0012678716431980997}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.21768648734893284, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.003115267847510722}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.12141179293846815, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0017373975644363541}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 0.8345839792934845, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.09663801407092908}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/1b121b21bc4seed1/evaluation/generation/agg.1b121b21bc4seed1_gem_xsum_article_DOC_summary_3.json b/1b121b21bc4seed1/evaluation/generation/agg.1b121b21bc4seed1_gem_xsum_article_DOC_summary_3.json new file mode 100644 index 0000000000000000000000000000000000000000..f96c3de54e30824e5fe7a354216a07b930c0a492 --- /dev/null +++ b/1b121b21bc4seed1/evaluation/generation/agg.1b121b21bc4seed1_gem_xsum_article_DOC_summary_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.10606297790246366, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0017854168680511101}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.2559365393746863, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.003942828057917467}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.14641419405475198, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0022626874492042907}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.016403947053914306, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007741120118238733}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.04155268993757446, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002004912080845838}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.023068148270822337, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001082001329317035}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.08438433169380888, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0013959138179342146}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.20443934586419923, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.003127827147724924}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.11651320027532101, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0017495857212361317}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.08473700150035146, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0014635025254577177}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.20585072949190508, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.003317649942197773}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.11708695716505582, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0018525946257683778}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 0.9311539798670635, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.09107540142081379}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/1b121b21bc4seed1/evaluation/generation/agg.1b121b21bc4seed1_gem_xsum_article_DOC_summary_4.json b/1b121b21bc4seed1/evaluation/generation/agg.1b121b21bc4seed1_gem_xsum_article_DOC_summary_4.json new file mode 100644 index 0000000000000000000000000000000000000000..09832432e2b465a53545bf5e4783de59889634f8 --- /dev/null +++ b/1b121b21bc4seed1/evaluation/generation/agg.1b121b21bc4seed1_gem_xsum_article_DOC_summary_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.033538556464056984, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002282970207590659}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.061278166608827844, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0035032648267361863}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.03857476484604358, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002181373104120625}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.00356863909695226, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.00043019877312427664}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.007827354388277672, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.000890140246104386}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.004640907524463805, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.000536562366213917}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.026997141398160576, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001907201107733291}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.049289096496901386, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0027778936304874483}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.03084447504069215, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001708948915334388}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.027395316222004706, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0019605932238404397}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.04960704068168692, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002857971818835903}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.03116504304791766, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0017650576678384076}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 0.41043347346219244, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.1486020805997744}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/1b121b21bc4seed1/evaluation/generation/agg.1b121b21bc4seed1_gem_xsum_article_DOC_summary_5.json b/1b121b21bc4seed1/evaluation/generation/agg.1b121b21bc4seed1_gem_xsum_article_DOC_summary_5.json new file mode 100644 index 0000000000000000000000000000000000000000..a894652f4e09647fbe03abf932673b1c2ff9188d --- /dev/null +++ b/1b121b21bc4seed1/evaluation/generation/agg.1b121b21bc4seed1_gem_xsum_article_DOC_summary_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.0021237847249880666, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0005810244101355184}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.00177754327837735, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.00048757744409275904}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.0018825860372170817, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0005105425641834596}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.00019654088050314464, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.00015261564209740738}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.00019511149228130362, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.00016439589503089688}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.00019318274102930717, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.00015698812424376165}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.0017497614736063241, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.00048095662458468534}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.001513011919166749, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0004307689764831507}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.0015759792816185546, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.00043710297005663255}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.0018510098059867322, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.000507889962370857}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.0016014978567092907, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0004541344456295751}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.0016704094537401807, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.000463071140217582}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.7812749842983558e-39, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 6.173625004905157e-36}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_GEM-web_nlg_en_PALM_prompt_0.jsonl b/1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_GEM-web_nlg_en_PALM_prompt_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..80cb363dc32d480cace84c6eae96eb9b8b1cd9a1 --- /dev/null +++ b/1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_GEM-web_nlg_en_PALM_prompt_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9d2121fd7f3724009e7ea41015d9066c04de5a71019016e2c88766323e4f1df +size 4123649 diff --git a/1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_GEM-web_nlg_en_PALM_prompt_1.jsonl b/1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_GEM-web_nlg_en_PALM_prompt_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..ee8fa0c97f6f23681a5d1c610c27a19645157b85 --- /dev/null +++ b/1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_GEM-web_nlg_en_PALM_prompt_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d7007c7371cd9fe64ee37a70279b12f4f1d9a047ef4a21cc1688f5ed96abddb +size 5156023 diff --git a/1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_GEM-web_nlg_en_PALM_prompt_2.jsonl b/1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_GEM-web_nlg_en_PALM_prompt_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..b864d69946dbeb8e21be87b17b4d0ab6919157ac --- /dev/null +++ b/1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_GEM-web_nlg_en_PALM_prompt_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f04e15e5a56936bb29d1f701c0fc4f42f3781e522f6013f5673a7170ebbdeb37 +size 6059579 diff --git a/1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_GEM-web_nlg_en_PALM_prompt_3.jsonl b/1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_GEM-web_nlg_en_PALM_prompt_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..c2f0809b522dfcc30196ab49c335dad0f168a703 --- /dev/null +++ b/1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_GEM-web_nlg_en_PALM_prompt_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a0a94433b46fb67748db7e3067a1bdb3e42a2c30f3917054b1f86fbb8b4e0da +size 6971963 diff --git a/1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_GEM-web_nlg_en_PALM_prompt_4.jsonl b/1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_GEM-web_nlg_en_PALM_prompt_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..8919a70fb90b58f4ad1524a626c17c811771d293 --- /dev/null +++ b/1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_GEM-web_nlg_en_PALM_prompt_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d0000fdf72acf9c7bfde400b8f82e580ac264fa2bc2c81fc406f3e9e7fef99a +size 7866268 diff --git a/1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_GEM-web_nlg_en_PALM_prompt_5.jsonl b/1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_GEM-web_nlg_en_PALM_prompt_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..8ff9311a1158f248e029a04dd9507f1740d82690 --- /dev/null +++ b/1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_GEM-web_nlg_en_PALM_prompt_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01d7ba121fbedb1fc5c3fa8ad0a5c0ee6580f91976bc66f4fa3a1d09884c3ecf +size 8766808 diff --git a/1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_GEM-wiki_lingua_en_tldr_en_0.jsonl b/1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_GEM-wiki_lingua_en_tldr_en_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..0b19d11de527c3200fd103075f5c769ee8b7bfa3 --- /dev/null +++ b/1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_GEM-wiki_lingua_en_tldr_en_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10dbe0aaee41795ac2665a9ed3481d49352ed90545785cabe0a85ee84c627f80 +size 7698478 diff --git a/1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_GEM-wiki_lingua_en_tldr_en_1.jsonl b/1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_GEM-wiki_lingua_en_tldr_en_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e03ca10e62832a2e64e9cd8054bdd91799cb7367 --- /dev/null +++ b/1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_GEM-wiki_lingua_en_tldr_en_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9db705c89e34daa1669de250a077979df0895609b251906ce12cf2b6845e6a7 +size 13335999 diff --git a/1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_GEM-wiki_lingua_en_tldr_en_2.jsonl b/1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_GEM-wiki_lingua_en_tldr_en_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..704dae3676784032f587476a37bf07c2c04544c2 --- /dev/null +++ b/1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_GEM-wiki_lingua_en_tldr_en_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:588cf19d11278365c136ef6d62d4ef5930cfd748f888f0868b3287c2e042ba6b +size 18917998 diff --git a/1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_GEM-wiki_lingua_en_tldr_en_3.jsonl b/1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_GEM-wiki_lingua_en_tldr_en_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..7fa630d6a7fcf1228f310a7b78ff19c590e271b8 --- /dev/null +++ b/1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_GEM-wiki_lingua_en_tldr_en_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bac89f6dd45fa32455fa106fe919fcb85fac76a97f3c5756e335bc886961e114 +size 24325302 diff --git a/1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_GEM-wiki_lingua_en_tldr_en_4.jsonl b/1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_GEM-wiki_lingua_en_tldr_en_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..3f581a6bd2a50bb683f647460e86d4c21cc6532c --- /dev/null +++ b/1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_GEM-wiki_lingua_en_tldr_en_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2418597903481fc954521c8cea44736d269eee63b05cc1aba40c2364e0faffcc +size 29469238 diff --git a/1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_GEM-wiki_lingua_en_tldr_en_5.jsonl b/1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_GEM-wiki_lingua_en_tldr_en_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..f2ccdbf3ab26d2b1fa21398b113c354f118f49bd --- /dev/null +++ b/1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_GEM-wiki_lingua_en_tldr_en_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd2e0236b53e3090e6c13b7740ce6fe276f5fe22308bbd439d1131d767e53109 +size 34799439 diff --git a/1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl b/1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..cba88b02c0bf495b6c4d506e84725d2d04b25128 --- /dev/null +++ b/1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b4ab57ce200ce0a8393da5290df3ab47a9b91ab52504229f05d75fd8425dfcf +size 3813663 diff --git a/1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl b/1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..cad55e93c076d06795e4edb4f6163660ea7741af --- /dev/null +++ b/1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0de2526a87c8622c5d8d62a9ce057c15761545b2e0c8f25e6a4da518554a9ebe +size 5359955 diff --git a/1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl b/1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..7d0c06d92c3c0b85b072ecb1d87fe5bd2c09ee36 --- /dev/null +++ b/1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee5fdfde40f31fa51cb0ccb8e5e71a9b17baf575f1e5eb3fa1f4d799b96ba605 +size 6464952 diff --git a/1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl b/1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..d0a812b40de36ade6fa5e47dce465b0ed28aa451 --- /dev/null +++ b/1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:010e9d4097723769c56d4bd97ca744d9d1b8254c934f666a621b54c1b3d9d83c +size 7546591 diff --git a/1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl b/1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..5ce6fb857a5fee8f06efec50fc51fb864808012a --- /dev/null +++ b/1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8e49d09fff978c984df9f3e4ea61bfa79be6684838ac448bc7bb3cfe6dc4361 +size 8605770 diff --git a/1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl b/1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..388a103ebd33d1b7efca433bea6a73495fc61991 --- /dev/null +++ b/1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9def1c8882a5671fe86a5540fdc61b48df44b8d65b3d96c5dd6b90b3726613c +size 9669732 diff --git a/1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_gem_xsum_article_DOC_summary_0.jsonl b/1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_gem_xsum_article_DOC_summary_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..4fdf09928cfc7d08e07165eae9f9d9fcdbb8d2a2 --- /dev/null +++ b/1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_gem_xsum_article_DOC_summary_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:795bbd7da9eb20795e79af938d1c94533f330fc91eaec95c8fd790f5b7f1afd3 +size 2838934 diff --git a/1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_gem_xsum_article_DOC_summary_1.jsonl b/1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_gem_xsum_article_DOC_summary_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..6651c701a8ae27986168a3c4ef09a643b395308b --- /dev/null +++ b/1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_gem_xsum_article_DOC_summary_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f9b2cbd90c27f8b737c60a80a46b8a5a9a05ed7ecc960607d85cb4d9f5e57df +size 5105192 diff --git a/1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_gem_xsum_article_DOC_summary_2.jsonl b/1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_gem_xsum_article_DOC_summary_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..7150e0d075315f142eafa3fde6264979488d29cd --- /dev/null +++ b/1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_gem_xsum_article_DOC_summary_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d370f27abc098b77a7f945fe892ee504bc05d8624d65947b85bf44ba8e88da86 +size 7377387 diff --git a/1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_gem_xsum_article_DOC_summary_3.jsonl b/1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_gem_xsum_article_DOC_summary_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..4e07bbdd4459cb0805e70697e08bb2b50f3a38ef --- /dev/null +++ b/1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_gem_xsum_article_DOC_summary_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8359ff8847bf5b3b599cdee13485e4133ef75bc0d7c035fd72bda8a79f72e8f +size 9647200 diff --git a/1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_gem_xsum_article_DOC_summary_4.jsonl b/1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_gem_xsum_article_DOC_summary_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..6e759982bcc326c07d42fc62e67c4b238add593a --- /dev/null +++ b/1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_gem_xsum_article_DOC_summary_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3ea3521f01e837b06ad58355e744e06f01bfc7772e74cea3631eae0c703be66 +size 11672907 diff --git a/1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_gem_xsum_article_DOC_summary_5.jsonl b/1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_gem_xsum_article_DOC_summary_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..189b6eec51beadff49a553def1143a4da27391ce --- /dev/null +++ b/1b121b21bc4seed1/evaluation/generation/examples.1b121b21bc4seed1_gem_xsum_article_DOC_summary_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc427206ffdf7a115c525a593403a7ef67d520412f38f604be0e03238fa56d90 +size 13897443 diff --git a/1b121b21bc4seed1/evaluation/generation/merged.csv b/1b121b21bc4seed1/evaluation/generation/merged.csv new file mode 100644 index 0000000000000000000000000000000000000000..18e46a7c93f0c4ce0e8eab6e0600be2a945155ba --- /dev/null +++ b/1b121b21bc4seed1/evaluation/generation/merged.csv @@ -0,0 +1,53 @@ +dataset,fewshots,prompt,metric,value +e2e_nlg_cleaned,0,generate_text_restaurant,rouge2_fmeasure,0.008523314750914139 +e2e_nlg_cleaned,0,median,rouge2_fmeasure,0.008523314750914139 +e2e_nlg_cleaned,1,generate_text_restaurant,rouge2_fmeasure,0.13126151027829455 +e2e_nlg_cleaned,1,median,rouge2_fmeasure,0.13126151027829455 +e2e_nlg_cleaned,2,generate_text_restaurant,rouge2_fmeasure,0.14693316116112215 +e2e_nlg_cleaned,2,median,rouge2_fmeasure,0.14693316116112215 +e2e_nlg_cleaned,3,generate_text_restaurant,rouge2_fmeasure,0.15787398183922485 +e2e_nlg_cleaned,3,median,rouge2_fmeasure,0.15787398183922485 +e2e_nlg_cleaned,4,generate_text_restaurant,rouge2_fmeasure,0.17345256590048624 +e2e_nlg_cleaned,4,median,rouge2_fmeasure,0.17345256590048624 +e2e_nlg_cleaned,5,generate_text_restaurant,rouge2_fmeasure,0.18712397033462674 +e2e_nlg_cleaned,5,median,rouge2_fmeasure,0.18712397033462674 +e2e_nlg_cleaned,5,average,multiple,0.1341947507107781 +gem_xsum,0,article_DOC_summary,rouge2_fmeasure,0.0362962242227074 +gem_xsum,0,median,rouge2_fmeasure,0.0362962242227074 +gem_xsum,1,article_DOC_summary,rouge2_fmeasure,0.021870860381131174 +gem_xsum,1,median,rouge2_fmeasure,0.021870860381131174 +gem_xsum,2,article_DOC_summary,rouge2_fmeasure,0.023831872627776102 +gem_xsum,2,median,rouge2_fmeasure,0.023831872627776102 +gem_xsum,3,article_DOC_summary,rouge2_fmeasure,0.023068148270822337 +gem_xsum,3,median,rouge2_fmeasure,0.023068148270822337 +gem_xsum,4,article_DOC_summary,rouge2_fmeasure,0.004640907524463805 +gem_xsum,4,median,rouge2_fmeasure,0.004640907524463805 +gem_xsum,5,article_DOC_summary,rouge2_fmeasure,0.00019318274102930717 +gem_xsum,5,median,rouge2_fmeasure,0.00019318274102930717 +gem_xsum,5,average,multiple,0.018316865961321687 +web_nlg_en,0,PALM_prompt,rouge2_fmeasure,0.045045993698642706 +web_nlg_en,0,median,rouge2_fmeasure,0.045045993698642706 +web_nlg_en,1,PALM_prompt,rouge2_fmeasure,0.042453810034119334 +web_nlg_en,1,median,rouge2_fmeasure,0.042453810034119334 +web_nlg_en,2,PALM_prompt,rouge2_fmeasure,0.04191645296449831 +web_nlg_en,2,median,rouge2_fmeasure,0.04191645296449831 +web_nlg_en,3,PALM_prompt,rouge2_fmeasure,0.042391214062896254 +web_nlg_en,3,median,rouge2_fmeasure,0.042391214062896254 +web_nlg_en,4,PALM_prompt,rouge2_fmeasure,0.043124737274736084 +web_nlg_en,4,median,rouge2_fmeasure,0.043124737274736084 +web_nlg_en,5,PALM_prompt,rouge2_fmeasure,0.04331193468813116 +web_nlg_en,5,median,rouge2_fmeasure,0.04331193468813116 +web_nlg_en,5,average,multiple,0.04304069045383731 +wiki_lingua_en,0,tldr_en,rouge2_fmeasure,0.034308638506432475 +wiki_lingua_en,0,median,rouge2_fmeasure,0.034308638506432475 +wiki_lingua_en,1,tldr_en,rouge2_fmeasure,0.028880049821475656 +wiki_lingua_en,1,median,rouge2_fmeasure,0.028880049821475656 +wiki_lingua_en,2,tldr_en,rouge2_fmeasure,0.033005228021297704 +wiki_lingua_en,2,median,rouge2_fmeasure,0.033005228021297704 +wiki_lingua_en,3,tldr_en,rouge2_fmeasure,0.02907493824937833 +wiki_lingua_en,3,median,rouge2_fmeasure,0.02907493824937833 +wiki_lingua_en,4,tldr_en,rouge2_fmeasure,0.010104805168030258 +wiki_lingua_en,4,median,rouge2_fmeasure,0.010104805168030258 +wiki_lingua_en,5,tldr_en,rouge2_fmeasure,0.0016583152317218213 +wiki_lingua_en,5,median,rouge2_fmeasure,0.0016583152317218213 +wiki_lingua_en,5,average,multiple,0.022838662499722707 diff --git a/1b121b21bc4seed1/evaluation/generation/merged.json b/1b121b21bc4seed1/evaluation/generation/merged.json new file mode 100644 index 0000000000000000000000000000000000000000..23db7a126ddcd47aab3f0a009fe0f37a48e8ef65 --- /dev/null +++ b/1b121b21bc4seed1/evaluation/generation/merged.json @@ -0,0 +1 @@ +{"GEM/web_nlg_en": {"0": {"PALM_prompt": {"bleu": 0.31005545889675595, "bleu_stderr": 0.024221663303322493, "rouge1_fmeasure": 0.09455536275767198, "rouge1_fmeasure_stderr": 0.0020202782477753084, "rouge1_precision": 0.06333959745402563, "rouge1_precision_stderr": 0.0017129657332336005, "rouge1_recall": 0.2660634003689691, "rouge1_recall_stderr": 0.004758664963766919, "rouge2_fmeasure": 0.045045993698642706, "rouge2_fmeasure_stderr": 0.0012585799900103791, "rouge2_precision": 0.02992387161371905, "rouge2_precision_stderr": 0.0010678757643085887, "rouge2_recall": 0.13162654248190145, "rouge2_recall_stderr": 0.003224162069371238, "rougeL_fmeasure": 0.09174293269832776, "rougeL_fmeasure_stderr": 0.0018940760825308196, "rougeL_precision": 0.061154332270835166, "rougeL_precision_stderr": 0.0015925366548222631, "rougeL_recall": 0.26067769163704907, "rougeL_recall_stderr": 0.004663300404214987, "rougeLsum_fmeasure": 0.0906091189082405, "rougeLsum_fmeasure_stderr": 0.001901338184221523, "rougeLsum_precision": 0.06064250474249417, "rougeLsum_precision_stderr": 0.001621939447674481, "rougeLsum_recall": 0.25579533250119046, "rougeLsum_recall_stderr": 0.004509656638017682}}, "1": {"PALM_prompt": {"bleu": 0.3253498336709165, "bleu_stderr": 0.03212142507533847, "rouge1_fmeasure": 0.09469312150361009, "rouge1_fmeasure_stderr": 0.001863178804950363, "rouge1_precision": 0.060918256661001154, "rouge1_precision_stderr": 0.001387907396461889, "rouge1_recall": 0.3063168556661825, "rouge1_recall_stderr": 0.005105195108996422, "rouge2_fmeasure": 0.042453810034119334, "rouge2_fmeasure_stderr": 0.001154483862783651, "rouge2_precision": 0.027316953543545387, "rouge2_precision_stderr": 0.0008360022968447658, "rouge2_recall": 0.1391741163483647, "rouge2_recall_stderr": 0.0032268292328296168, "rougeL_fmeasure": 0.08927770465065916, "rougeL_fmeasure_stderr": 0.0016929550946172228, "rougeL_precision": 0.05742537248926894, "rougeL_precision_stderr": 0.0012621921122595368, "rougeL_recall": 0.2883872431662452, "rougeL_recall_stderr": 0.004673161214630172, "rougeLsum_fmeasure": 0.09008895599436548, "rougeLsum_fmeasure_stderr": 0.0017491206522219078, "rougeLsum_precision": 0.058015541222877484, "rougeLsum_precision_stderr": 0.0013118024160571136, "rougeLsum_recall": 0.2900074000424914, "rougeLsum_recall_stderr": 0.0046821199593389245}}, "2": {"PALM_prompt": {"bleu": 0.31791276568975185, "bleu_stderr": 0.02727147856829631, "rouge1_fmeasure": 0.09336715846217024, "rouge1_fmeasure_stderr": 0.0016996772402870365, "rouge1_precision": 0.05962717338634471, "rouge1_precision_stderr": 0.00126061681638203, "rouge1_recall": 0.30756287355829814, "rouge1_recall_stderr": 0.004889305792734938, "rouge2_fmeasure": 0.04191645296449831, "rouge2_fmeasure_stderr": 0.0010709241966443265, "rouge2_precision": 0.02670280090842877, "rouge2_precision_stderr": 0.0007604338404443195, "rouge2_recall": 0.14249676402659822, "rouge2_recall_stderr": 0.0032896138546168476, "rougeL_fmeasure": 0.08815984465580837, "rougeL_fmeasure_stderr": 0.0015470326777333359, "rougeL_precision": 0.05627058448383118, "rougeL_precision_stderr": 0.0011470016078651416, "rougeL_recall": 0.2896458162973523, "rougeL_recall_stderr": 0.0044554794302764, "rougeLsum_fmeasure": 0.08926200923694406, "rougeLsum_fmeasure_stderr": 0.001613762141288785, "rougeLsum_precision": 0.05706756866828331, "rougeLsum_precision_stderr": 0.0012020871707703095, "rougeLsum_recall": 0.292251335959323, "rougeLsum_recall_stderr": 0.004510651275741409}}, "3": {"PALM_prompt": {"bleu": 0.3212440432130126, "bleu_stderr": 0.02833396914504117, "rouge1_fmeasure": 0.09437325152413317, "rouge1_fmeasure_stderr": 0.0016293117647949373, "rouge1_precision": 0.06018320328990788, "rouge1_precision_stderr": 0.0012792421021156602, "rouge1_recall": 0.31701882107369783, "rouge1_recall_stderr": 0.004918042604954739, "rouge2_fmeasure": 0.042391214062896254, "rouge2_fmeasure_stderr": 0.0010316080252432995, "rouge2_precision": 0.02718506309171944, "rouge2_precision_stderr": 0.000834511570552857, "rouge2_recall": 0.14788498862069166, "rouge2_recall_stderr": 0.0033325099175022747, "rougeL_fmeasure": 0.08870171226199733, "rougeL_fmeasure_stderr": 0.0014934510170629485, "rougeL_precision": 0.05656198333950361, "rougeL_precision_stderr": 0.0011649029158652883, "rougeL_recall": 0.2959773638751678, "rougeL_recall_stderr": 0.004411378256218955, "rougeLsum_fmeasure": 0.0897987691484568, "rougeLsum_fmeasure_stderr": 0.0015399085797828443, "rougeLsum_precision": 0.05732291421825896, "rougeLsum_precision_stderr": 0.0012233313963698896, "rougeLsum_recall": 0.3008574516119203, "rougeLsum_recall_stderr": 0.004550770798562808}}, "4": {"PALM_prompt": {"bleu": 0.34701320585063394, "bleu_stderr": 0.012982772867681795, "rouge1_fmeasure": 0.09652792542278772, "rouge1_fmeasure_stderr": 0.0015764734075382092, "rouge1_precision": 0.06139220025240579, "rouge1_precision_stderr": 0.001204641896215659, "rouge1_recall": 0.32370589082989293, "rouge1_recall_stderr": 0.004818041311873955, "rouge2_fmeasure": 0.043124737274736084, "rouge2_fmeasure_stderr": 0.0010143599611912326, "rouge2_precision": 0.027393636493786414, "rouge2_precision_stderr": 0.0007666521742975135, "rouge2_recall": 0.15165230865373422, "rouge2_recall_stderr": 0.003290995473977093, "rougeL_fmeasure": 0.09083921184905662, "rougeL_fmeasure_stderr": 0.0014744271896824609, "rougeL_precision": 0.057858738343212236, "rougeL_precision_stderr": 0.0011371996173128948, "rougeL_recall": 0.3014171252596505, "rougeL_recall_stderr": 0.004324422192213472, "rougeLsum_fmeasure": 0.09197412784787223, "rougeLsum_fmeasure_stderr": 0.0015015595131035856, "rougeLsum_precision": 0.05856942284861244, "rougeLsum_precision_stderr": 0.0011580171724704853, "rougeLsum_recall": 0.30659074236282113, "rougeLsum_recall_stderr": 0.004443465919036145}}, "5": {"PALM_prompt": {"bleu": 0.3826134137609412, "bleu_stderr": 0.027260987836796497, "rouge1_fmeasure": 0.09769981149870674, "rouge1_fmeasure_stderr": 0.0015568330004171944, "rouge1_precision": 0.06210934649298242, "rouge1_precision_stderr": 0.0011637172836219596, "rouge1_recall": 0.32987573012277627, "rouge1_recall_stderr": 0.0048175275958975364, "rouge2_fmeasure": 0.04331193468813116, "rouge2_fmeasure_stderr": 0.0009723654636517451, "rouge2_precision": 0.027334516755102147, "rouge2_precision_stderr": 0.0006792346244010215, "rouge2_recall": 0.1540494964221242, "rouge2_recall_stderr": 0.0033061515191188284, "rougeL_fmeasure": 0.09131104015906616, "rougeL_fmeasure_stderr": 0.0014304797258199975, "rougeL_precision": 0.058131690562405976, "rougeL_precision_stderr": 0.001071674347816923, "rougeL_recall": 0.30470149207947667, "rougeL_recall_stderr": 0.004224186135139794, "rougeLsum_fmeasure": 0.09280326127954946, "rougeLsum_fmeasure_stderr": 0.0014767682135790052, "rougeLsum_precision": 0.05908274659378142, "rougeLsum_precision_stderr": 0.0011102880375707994, "rougeLsum_recall": 0.3110966005686351, "rougeLsum_recall_stderr": 0.004419284614315986}}}, "GEM/wiki_lingua_en": {"0": {"tldr_en": {"bleu": 1.4836403082580132, "bleu_stderr": 0.04275891251756906, "rouge1_fmeasure": 0.16854478548066482, "rouge1_fmeasure_stderr": 0.0018569277613818772, "rouge1_precision": 0.1444356353252771, "rouge1_precision_stderr": 0.0018890228924276567, "rouge1_recall": 0.24333387644429813, "rouge1_recall_stderr": 0.0026067622578618776, "rouge2_fmeasure": 0.034308638506432475, "rouge2_fmeasure_stderr": 0.0008125402811211317, "rouge2_precision": 0.029280987606291494, "rouge2_precision_stderr": 0.0007237627275927142, "rouge2_recall": 0.05112009572683697, "rouge2_recall_stderr": 0.001337818306117227, "rougeL_fmeasure": 0.13358205180049998, "rougeL_fmeasure_stderr": 0.0013364507319559807, "rougeL_precision": 0.11294853294767912, "rougeL_precision_stderr": 0.0013180107899456023, "rougeL_recall": 0.19771034044326136, "rougeL_recall_stderr": 0.002117097962875754, "rougeLsum_fmeasure": 0.1549132489748441, "rougeLsum_fmeasure_stderr": 0.0016876295948321293, "rougeLsum_precision": 0.13255355115964793, "rougeLsum_precision_stderr": 0.0017152326851252678, "rougeLsum_recall": 0.2246765687186434, "rougeLsum_recall_stderr": 0.002420653997148166}}, "1": {"tldr_en": {"bleu": 1.368798582263273, "bleu_stderr": 0.03762251064773447, "rouge1_fmeasure": 0.16619267944887964, "rouge1_fmeasure_stderr": 0.001744164720654144, "rouge1_precision": 0.14337611363324493, "rouge1_precision_stderr": 0.0017975787265801645, "rouge1_recall": 0.2401884909277128, "rouge1_recall_stderr": 0.002577850850716675, "rouge2_fmeasure": 0.028880049821475656, "rouge2_fmeasure_stderr": 0.0007891070933473794, "rouge2_precision": 0.024778664535770947, "rouge2_precision_stderr": 0.0007555235233701629, "rouge2_recall": 0.04385427041760851, "rouge2_recall_stderr": 0.0013655854605521512, "rougeL_fmeasure": 0.12166495381666467, "rougeL_fmeasure_stderr": 0.0011944014882187845, "rougeL_precision": 0.10397637743893304, "rougeL_precision_stderr": 0.001235246358495789, "rougeL_recall": 0.18006724988321413, "rougeL_recall_stderr": 0.0019906559738365613, "rougeLsum_fmeasure": 0.15572261717667488, "rougeLsum_fmeasure_stderr": 0.0016216939170534584, "rougeLsum_precision": 0.13419081390261864, "rougeLsum_precision_stderr": 0.0016722655575097506, "rougeLsum_recall": 0.22568787667911147, "rougeLsum_recall_stderr": 0.002430850770097226}}, "2": {"tldr_en": {"bleu": 1.5622860462600348, "bleu_stderr": 0.043740854824911794, "rouge1_fmeasure": 0.17019067213369107, "rouge1_fmeasure_stderr": 0.0017690889374743603, "rouge1_precision": 0.15063044447280027, "rouge1_precision_stderr": 0.001940763130936743, "rouge1_recall": 0.23931115978829579, "rouge1_recall_stderr": 0.0024971943832608266, "rouge2_fmeasure": 0.033005228021297704, "rouge2_fmeasure_stderr": 0.0008241949468737384, "rouge2_precision": 0.029664097877505877, "rouge2_precision_stderr": 0.0009118238978394307, "rouge2_recall": 0.04760945326052988, "rouge2_recall_stderr": 0.001306711433850517, "rougeL_fmeasure": 0.131223027742424, "rougeL_fmeasure_stderr": 0.0012757407637194174, "rougeL_precision": 0.11542835667429227, "rougeL_precision_stderr": 0.0014439177169422246, "rougeL_recall": 0.18791535392357211, "rougeL_recall_stderr": 0.001981689065390633, "rougeLsum_fmeasure": 0.15936229418185377, "rougeLsum_fmeasure_stderr": 0.0016407771888788867, "rougeLsum_precision": 0.14098071498465764, "rougeLsum_precision_stderr": 0.001813064708734854, "rougeLsum_recall": 0.22467978591395918, "rougeLsum_recall_stderr": 0.0023443476592751983}}, "3": {"tldr_en": {"bleu": 1.5234316086072492, "bleu_stderr": 0.04994760816269213, "rouge1_fmeasure": 0.1459775119747986, "rouge1_fmeasure_stderr": 0.002013820231047812, "rouge1_precision": 0.13853097159476044, "rouge1_precision_stderr": 0.0024033845722523724, "rouge1_recall": 0.2022241539975303, "rouge1_recall_stderr": 0.002895744315329479, "rouge2_fmeasure": 0.02907493824937833, "rouge2_fmeasure_stderr": 0.0008064371846682719, "rouge2_precision": 0.027922753485106568, "rouge2_precision_stderr": 0.0010069321667728792, "rouge2_recall": 0.041810329656802245, "rouge2_recall_stderr": 0.00129627924231701, "rougeL_fmeasure": 0.11526184202559941, "rougeL_fmeasure_stderr": 0.0015132431316080114, "rougeL_precision": 0.10946213334283154, "rougeL_precision_stderr": 0.0019316172770680437, "rougeL_recall": 0.1624038367425624, "rougeL_recall_stderr": 0.0023444744969795006, "rougeLsum_fmeasure": 0.1361503335550405, "rougeLsum_fmeasure_stderr": 0.001865935511568599, "rougeLsum_precision": 0.1294243469444916, "rougeLsum_precision_stderr": 0.0022694744228463435, "rougeLsum_recall": 0.18910016521383136, "rougeLsum_recall_stderr": 0.0027080908132011243}}, "4": {"tldr_en": {"bleu": 0.41252863907826776, "bleu_stderr": 0.030373767513404697, "rouge1_fmeasure": 0.04937920113316496, "rouge1_fmeasure_stderr": 0.0017006423976957319, "rouge1_precision": 0.048283116115591836, "rouge1_precision_stderr": 0.0018762804337576465, "rouge1_recall": 0.07012389259959088, "rouge1_recall_stderr": 0.0024827186502375275, "rouge2_fmeasure": 0.010104805168030258, "rouge2_fmeasure_stderr": 0.0005574344481643184, "rouge2_precision": 0.009647802697589025, "rouge2_precision_stderr": 0.0006103768053178551, "rouge2_recall": 0.015261115214929618, "rouge2_recall_stderr": 0.0009960688572823394, "rougeL_fmeasure": 0.04024639157961486, "rougeL_fmeasure_stderr": 0.0013631991023636098, "rougeL_precision": 0.039482927106928814, "rougeL_precision_stderr": 0.0015510440139044537, "rougeL_recall": 0.05812150365824274, "rougeL_recall_stderr": 0.00207507825756795, "rougeLsum_fmeasure": 0.045827471133389246, "rougeLsum_fmeasure_stderr": 0.001572714794925252, "rougeLsum_precision": 0.04495702046511921, "rougeLsum_precision_stderr": 0.0017562417792707258, "rougeLsum_recall": 0.06533375820468378, "rougeLsum_recall_stderr": 0.0023195859576008596}}, "5": {"tldr_en": {"bleu": 1.1512232954144342e-06, "bleu_stderr": 2.094932653320538e-06, "rouge1_fmeasure": 0.008092466035741461, "rouge1_fmeasure_stderr": 0.0007725180183102787, "rouge1_precision": 0.008053948401330599, "rouge1_precision_stderr": 0.0008246264662235712, "rouge1_recall": 0.011572381851776472, "rouge1_recall_stderr": 0.0011296167548172531, "rouge2_fmeasure": 0.0016583152317218213, "rouge2_fmeasure_stderr": 0.00024030776163960353, "rouge2_precision": 0.0016487162145299862, "rouge2_precision_stderr": 0.00028855076065369416, "rouge2_recall": 0.002359034970945986, "rouge2_recall_stderr": 0.00033523534751396603, "rougeL_fmeasure": 0.006591147101382126, "rougeL_fmeasure_stderr": 0.0006203194340556792, "rougeL_precision": 0.006581900525062106, "rougeL_precision_stderr": 0.0006767336687555497, "rougeL_recall": 0.009604072556401588, "rougeL_recall_stderr": 0.0009440395007256133, "rougeLsum_fmeasure": 0.00747305417348784, "rougeLsum_fmeasure_stderr": 0.000709782509687814, "rougeLsum_precision": 0.007446672471389, "rougeLsum_precision_stderr": 0.0007645726188902775, "rougeLsum_recall": 0.01074764632172318, "rougeLsum_recall_stderr": 0.0010438920929096284}}}, "e2e_nlg_cleaned": {"0": {"generate_text_restaurant": {"bleu": 0.7454534998692752, "bleu_stderr": 0.07804428323713496, "rouge1_fmeasure": 0.03918099607350703, "rouge1_fmeasure_stderr": 0.001448534494550284, "rouge1_precision": 0.06474609956563113, "rouge1_precision_stderr": 0.002808015303613375, "rouge1_recall": 0.0348307362954131, "rouge1_recall_stderr": 0.0014091894165256253, "rouge2_fmeasure": 0.008523314750914139, "rouge2_fmeasure_stderr": 0.00063055748185768, "rouge2_precision": 0.016683043975980968, "rouge2_precision_stderr": 0.0014447318755830502, "rouge2_recall": 0.007670856047129852, "rouge2_recall_stderr": 0.0005580500848436268, "rougeL_fmeasure": 0.033916243277006014, "rougeL_fmeasure_stderr": 0.001231432823341605, "rougeL_precision": 0.05551189449248439, "rougeL_precision_stderr": 0.00238259584939437, "rougeL_recall": 0.03040510241026872, "rougeL_recall_stderr": 0.0012245380288356473, "rougeLsum_fmeasure": 0.033158173617653046, "rougeLsum_fmeasure_stderr": 0.0011976728573487477, "rougeLsum_precision": 0.054968825384225664, "rougeLsum_precision_stderr": 0.0023305151110030124, "rougeLsum_recall": 0.02911562853755617, "rougeLsum_recall_stderr": 0.0011623178626526266}}, "1": {"generate_text_restaurant": {"bleu": 5.487694889793941, "bleu_stderr": 0.07555119011558427, "rouge1_fmeasure": 0.3321953827037549, "rouge1_fmeasure_stderr": 0.0020364301991294543, "rouge1_precision": 0.3097058053229197, "rouge1_precision_stderr": 0.002851087946324211, "rouge1_recall": 0.43110365850951743, "rouge1_recall_stderr": 0.002732778963977049, "rouge2_fmeasure": 0.13126151027829455, "rouge2_fmeasure_stderr": 0.001411164906927139, "rouge2_precision": 0.12287476036716052, "rouge2_precision_stderr": 0.0016877708444218635, "rouge2_recall": 0.17280953287169348, "rouge2_recall_stderr": 0.0019134667041499913, "rougeL_fmeasure": 0.24346830553368265, "rougeL_fmeasure_stderr": 0.0014712983587429052, "rougeL_precision": 0.22519107207919958, "rougeL_precision_stderr": 0.002044768338085085, "rougeL_recall": 0.32069030400568344, "rougeL_recall_stderr": 0.0022416724958190157, "rougeLsum_fmeasure": 0.2746466676619327, "rougeLsum_fmeasure_stderr": 0.0018777824275120166, "rougeLsum_precision": 0.25598458046409817, "rougeLsum_precision_stderr": 0.002501331832178447, "rougeLsum_recall": 0.35721132057108596, "rougeLsum_recall_stderr": 0.002561727405040063}}, "2": {"generate_text_restaurant": {"bleu": 6.079188977413186, "bleu_stderr": 0.09602875924306557, "rouge1_fmeasure": 0.346570361859306, "rouge1_fmeasure_stderr": 0.002052145530841731, "rouge1_precision": 0.3181407194694957, "rouge1_precision_stderr": 0.0029777295615160512, "rouge1_recall": 0.4561708867688496, "rouge1_recall_stderr": 0.0026452494137559723, "rouge2_fmeasure": 0.14693316116112215, "rouge2_fmeasure_stderr": 0.0014445847251510187, "rouge2_precision": 0.13642028395369205, "rouge2_precision_stderr": 0.0018950492351855646, "rouge2_recall": 0.19647624995791846, "rouge2_recall_stderr": 0.0019636015048637256, "rougeL_fmeasure": 0.25482744735128565, "rougeL_fmeasure_stderr": 0.0014755904280259592, "rougeL_precision": 0.2315672124269367, "rougeL_precision_stderr": 0.002127274716028904, "rougeL_recall": 0.3415431295705076, "rougeL_recall_stderr": 0.0022584378328241905, "rougeLsum_fmeasure": 0.2890174556326334, "rougeLsum_fmeasure_stderr": 0.0018995638277943165, "rougeLsum_precision": 0.2655109833740872, "rougeLsum_precision_stderr": 0.002636322289847473, "rougeLsum_recall": 0.38142593418332454, "rougeLsum_recall_stderr": 0.002536630793778901}}, "3": {"generate_text_restaurant": {"bleu": 5.439720663780092, "bleu_stderr": 0.09057671754019295, "rouge1_fmeasure": 0.35966978129457794, "rouge1_fmeasure_stderr": 0.0020809245391192944, "rouge1_precision": 0.33806886805387837, "rouge1_precision_stderr": 0.0031451949821916397, "rouge1_recall": 0.4597540434384101, "rouge1_recall_stderr": 0.0025911053727046204, "rouge2_fmeasure": 0.15787398183922485, "rouge2_fmeasure_stderr": 0.00151813234143548, "rouge2_precision": 0.15002040777811748, "rouge2_precision_stderr": 0.0019728388177885454, "rouge2_recall": 0.2046175785902067, "rouge2_recall_stderr": 0.001988761577155802, "rougeL_fmeasure": 0.26303596646553673, "rougeL_fmeasure_stderr": 0.001522516609384217, "rougeL_precision": 0.24363492051808863, "rougeL_precision_stderr": 0.0021801249774331755, "rougeL_recall": 0.3434646349475326, "rougeL_recall_stderr": 0.00230667877920879, "rougeLsum_fmeasure": 0.2981457337030485, "rougeLsum_fmeasure_stderr": 0.001964234489421683, "rougeLsum_precision": 0.2803542384188989, "rougeLsum_precision_stderr": 0.002777229104092061, "rougeLsum_recall": 0.3816738562894357, "rougeLsum_recall_stderr": 0.0025233042461889513}}, "4": {"generate_text_restaurant": {"bleu": 3.9189279109719335, "bleu_stderr": 0.08586279820080885, "rouge1_fmeasure": 0.3836182432795783, "rouge1_fmeasure_stderr": 0.0022054074783422308, "rouge1_precision": 0.39213707891049004, "rouge1_precision_stderr": 0.003422529928577996, "rouge1_recall": 0.44238533983355405, "rouge1_recall_stderr": 0.0025751632202055024, "rouge2_fmeasure": 0.17345256590048624, "rouge2_fmeasure_stderr": 0.001662967964824317, "rouge2_precision": 0.17932569557247965, "rouge2_precision_stderr": 0.0021875288020798776, "rouge2_recall": 0.2014446351152472, "rouge2_recall_stderr": 0.001986701156425044, "rougeL_fmeasure": 0.27924589416548823, "rougeL_fmeasure_stderr": 0.0017055264106925416, "rougeL_precision": 0.2822423599102126, "rougeL_precision_stderr": 0.002501678088025689, "rougeL_recall": 0.32790464597969743, "rougeL_recall_stderr": 0.0022994271661774903, "rougeLsum_fmeasure": 0.31650257132624704, "rougeLsum_fmeasure_stderr": 0.002105427772389244, "rougeLsum_precision": 0.3236183940771683, "rougeLsum_precision_stderr": 0.0030448679972683726, "rougeLsum_recall": 0.3650546853387208, "rougeLsum_recall_stderr": 0.002486300924606491}}, "5": {"generate_text_restaurant": {"bleu": 3.0686372723608897, "bleu_stderr": 0.06784266491877249, "rouge1_fmeasure": 0.4095857053929965, "rouge1_fmeasure_stderr": 0.0021530995714477558, "rouge1_precision": 0.4502554374503682, "rouge1_precision_stderr": 0.0033630982834692595, "rouge1_recall": 0.42945542013401933, "rouge1_recall_stderr": 0.002595990607765447, "rouge2_fmeasure": 0.18712397033462674, "rouge2_fmeasure_stderr": 0.0017078080439781192, "rouge2_precision": 0.20886191169135895, "rouge2_precision_stderr": 0.0023179990401586887, "rouge2_recall": 0.1967893746603374, "rouge2_recall_stderr": 0.001931221479807446, "rougeL_fmeasure": 0.29430723400568193, "rougeL_fmeasure_stderr": 0.001762954764782701, "rougeL_precision": 0.32145296922919064, "rougeL_precision_stderr": 0.0025789465971034213, "rougeL_recall": 0.3125724382034645, "rougeL_recall_stderr": 0.002290959462627688, "rougeLsum_fmeasure": 0.335707785812935, "rougeLsum_fmeasure_stderr": 0.0020851385129732505, "rougeLsum_precision": 0.36887628081177687, "rougeLsum_precision_stderr": 0.00302325518602794, "rougeLsum_recall": 0.3523561197227813, "rougeLsum_recall_stderr": 0.002466960449053646}}}, "gem_xsum": {"0": {"article_DOC_summary": {"bleu": 1.3841560907125259, "bleu_stderr": 0.07797827326949171, "rouge1_fmeasure": 0.19123744824446468, "rouge1_fmeasure_stderr": 0.0022992268247988583, "rouge1_precision": 0.13656588620899038, "rouge1_precision_stderr": 0.00174226154738388, "rouge1_recall": 0.3323235396298205, "rouge1_recall_stderr": 0.003846536397189559, "rouge2_fmeasure": 0.0362962242227074, "rouge2_fmeasure_stderr": 0.0012357989639325655, "rouge2_precision": 0.025701014397443208, "rouge2_precision_stderr": 0.0008822864860028765, "rouge2_recall": 0.06451842393614433, "rouge2_recall_stderr": 0.0022307575351008177, "rougeL_fmeasure": 0.14272621341641745, "rougeL_fmeasure_stderr": 0.0016087589844111059, "rougeL_precision": 0.10175956050352102, "rougeL_precision_stderr": 0.0012156226058548923, "rougeL_recall": 0.24958177981302834, "rougeL_recall_stderr": 0.0028231998096754063, "rougeLsum_fmeasure": 0.15074429962396632, "rougeLsum_fmeasure_stderr": 0.0018801101946759444, "rougeLsum_precision": 0.1074311808382226, "rougeLsum_precision_stderr": 0.0014050024971339861, "rougeLsum_recall": 0.2636816826721476, "rougeLsum_recall_stderr": 0.0032819789427964595}}, "1": {"article_DOC_summary": {"bleu": 0.7666050226687372, "bleu_stderr": 0.06474629405034218, "rouge1_fmeasure": 0.1490109968360671, "rouge1_fmeasure_stderr": 0.0021151321607124005, "rouge1_precision": 0.10551189065335231, "rouge1_precision_stderr": 0.0015632545047201442, "rouge1_recall": 0.26396369315037715, "rouge1_recall_stderr": 0.0036356422465613878, "rouge2_fmeasure": 0.021870860381131174, "rouge2_fmeasure_stderr": 0.0010335421346335594, "rouge2_precision": 0.015258372576455077, "rouge2_precision_stderr": 0.0007194850115847547, "rouge2_recall": 0.0401042986262725, "rouge2_recall_stderr": 0.0019569862879314013, "rougeL_fmeasure": 0.11776037181510428, "rougeL_fmeasure_stderr": 0.0015663569819055773, "rougeL_precision": 0.08322301164562862, "rougeL_precision_stderr": 0.0011487703143784498, "rougeL_recall": 0.20979036419712682, "rougeL_recall_stderr": 0.0028033758287091875, "rougeLsum_fmeasure": 0.11905956031628537, "rougeLsum_fmeasure_stderr": 0.0017138611513238453, "rougeLsum_precision": 0.08413103520980872, "rougeLsum_precision_stderr": 0.001254290848777802, "rougeLsum_recall": 0.21222983148038477, "rougeLsum_recall_stderr": 0.00304896385565602}}, "2": {"article_DOC_summary": {"bleu": 0.8345839792934845, "bleu_stderr": 0.09663801407092908, "rouge1_fmeasure": 0.15152826480726653, "rouge1_fmeasure_stderr": 0.002114221677973485, "rouge1_precision": 0.10715846509597497, "rouge1_precision_stderr": 0.0015697108273323291, "rouge1_recall": 0.2695418218368475, "rouge1_recall_stderr": 0.0036206648240501645, "rouge2_fmeasure": 0.023831872627776102, "rouge2_fmeasure_stderr": 0.001048493003352801, "rouge2_precision": 0.01667569031887618, "rouge2_precision_stderr": 0.0007375139406724271, "rouge2_recall": 0.043570635275517515, "rouge2_recall_stderr": 0.0019441097483278629, "rougeL_fmeasure": 0.12053707825720893, "rougeL_fmeasure_stderr": 0.0015925749869109209, "rougeL_precision": 0.08504138318382073, "rougeL_precision_stderr": 0.0011733846471463298, "rougeL_recall": 0.21610444539656637, "rougeL_recall_stderr": 0.002873607280157199, "rougeLsum_fmeasure": 0.12141179293846815, "rougeLsum_fmeasure_stderr": 0.0017373975644363541, "rougeLsum_precision": 0.0856088008772477, "rougeLsum_precision_stderr": 0.0012678716431980997, "rougeLsum_recall": 0.21768648734893284, "rougeLsum_recall_stderr": 0.003115267847510722}}, "3": {"article_DOC_summary": {"bleu": 0.9311539798670635, "bleu_stderr": 0.09107540142081379, "rouge1_fmeasure": 0.14641419405475198, "rouge1_fmeasure_stderr": 0.0022626874492042907, "rouge1_precision": 0.10606297790246366, "rouge1_precision_stderr": 0.0017854168680511101, "rouge1_recall": 0.2559365393746863, "rouge1_recall_stderr": 0.003942828057917467, "rouge2_fmeasure": 0.023068148270822337, "rouge2_fmeasure_stderr": 0.001082001329317035, "rouge2_precision": 0.016403947053914306, "rouge2_precision_stderr": 0.0007741120118238733, "rouge2_recall": 0.04155268993757446, "rouge2_recall_stderr": 0.002004912080845838, "rougeL_fmeasure": 0.11651320027532101, "rougeL_fmeasure_stderr": 0.0017495857212361317, "rougeL_precision": 0.08438433169380888, "rougeL_precision_stderr": 0.0013959138179342146, "rougeL_recall": 0.20443934586419923, "rougeL_recall_stderr": 0.003127827147724924, "rougeLsum_fmeasure": 0.11708695716505582, "rougeLsum_fmeasure_stderr": 0.0018525946257683778, "rougeLsum_precision": 0.08473700150035146, "rougeLsum_precision_stderr": 0.0014635025254577177, "rougeLsum_recall": 0.20585072949190508, "rougeLsum_recall_stderr": 0.003317649942197773}}, "4": {"article_DOC_summary": {"bleu": 0.41043347346219244, "bleu_stderr": 0.1486020805997744, "rouge1_fmeasure": 0.03857476484604358, "rouge1_fmeasure_stderr": 0.002181373104120625, "rouge1_precision": 0.033538556464056984, "rouge1_precision_stderr": 0.002282970207590659, "rouge1_recall": 0.061278166608827844, "rouge1_recall_stderr": 0.0035032648267361863, "rouge2_fmeasure": 0.004640907524463805, "rouge2_fmeasure_stderr": 0.000536562366213917, "rouge2_precision": 0.00356863909695226, "rouge2_precision_stderr": 0.00043019877312427664, "rouge2_recall": 0.007827354388277672, "rouge2_recall_stderr": 0.000890140246104386, "rougeL_fmeasure": 0.03084447504069215, "rougeL_fmeasure_stderr": 0.001708948915334388, "rougeL_precision": 0.026997141398160576, "rougeL_precision_stderr": 0.001907201107733291, "rougeL_recall": 0.049289096496901386, "rougeL_recall_stderr": 0.0027778936304874483, "rougeLsum_fmeasure": 0.03116504304791766, "rougeLsum_fmeasure_stderr": 0.0017650576678384076, "rougeLsum_precision": 0.027395316222004706, "rougeLsum_precision_stderr": 0.0019605932238404397, "rougeLsum_recall": 0.04960704068168692, "rougeLsum_recall_stderr": 0.002857971818835903}}, "5": {"article_DOC_summary": {"bleu": 1.7812749842983558e-39, "bleu_stderr": 6.173625004905157e-36, "rouge1_fmeasure": 0.0018825860372170817, "rouge1_fmeasure_stderr": 0.0005105425641834596, "rouge1_precision": 0.0021237847249880666, "rouge1_precision_stderr": 0.0005810244101355184, "rouge1_recall": 0.00177754327837735, "rouge1_recall_stderr": 0.00048757744409275904, "rouge2_fmeasure": 0.00019318274102930717, "rouge2_fmeasure_stderr": 0.00015698812424376165, "rouge2_precision": 0.00019654088050314464, "rouge2_precision_stderr": 0.00015261564209740738, "rouge2_recall": 0.00019511149228130362, "rouge2_recall_stderr": 0.00016439589503089688, "rougeL_fmeasure": 0.0015759792816185546, "rougeL_fmeasure_stderr": 0.00043710297005663255, "rougeL_precision": 0.0017497614736063241, "rougeL_precision_stderr": 0.00048095662458468534, "rougeL_recall": 0.001513011919166749, "rougeL_recall_stderr": 0.0004307689764831507, "rougeLsum_fmeasure": 0.0016704094537401807, "rougeLsum_fmeasure_stderr": 0.000463071140217582, "rougeLsum_precision": 0.0018510098059867322, "rougeLsum_precision_stderr": 0.000507889962370857, "rougeLsum_recall": 0.0016014978567092907, "rougeLsum_recall_stderr": 0.0004541344456295751}}}} \ No newline at end of file diff --git a/1b121b21bc4seed1/evaluation/generation/slim.1b121b21bc4seed1_GEM-web_nlg_en_PALM_prompt_0.json b/1b121b21bc4seed1/evaluation/generation/slim.1b121b21bc4seed1_GEM-web_nlg_en_PALM_prompt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..39b71ccdae22d4f68bbef6b909b0d25b772ad659 --- /dev/null +++ b/1b121b21bc4seed1/evaluation/generation/slim.1b121b21bc4seed1_GEM-web_nlg_en_PALM_prompt_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.31005545889675595, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.024221663303322493 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.06333959745402563, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0017129657332336005 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.2660634003689691, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.004758664963766919 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.09455536275767198, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0020202782477753084 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.02992387161371905, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0010678757643085887 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.13162654248190145, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003224162069371238 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.045045993698642706, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0012585799900103791 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.061154332270835166, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0015925366548222631 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.26067769163704907, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004663300404214987 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.09174293269832776, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0018940760825308196 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.06064250474249417, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.001621939447674481 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.25579533250119046, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004509656638017682 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.0906091189082405, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.001901338184221523 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed1/evaluation/generation/slim.1b121b21bc4seed1_GEM-web_nlg_en_PALM_prompt_1.json b/1b121b21bc4seed1/evaluation/generation/slim.1b121b21bc4seed1_GEM-web_nlg_en_PALM_prompt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..156ba58cb17ce4cf74c00407c2c08926915b2a7c --- /dev/null +++ b/1b121b21bc4seed1/evaluation/generation/slim.1b121b21bc4seed1_GEM-web_nlg_en_PALM_prompt_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.3253498336709165, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.03212142507533847 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.060918256661001154, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.001387907396461889 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.3063168556661825, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005105195108996422 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.09469312150361009, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.001863178804950363 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.027316953543545387, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0008360022968447658 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.1391741163483647, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0032268292328296168 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.042453810034119334, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.001154483862783651 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.05742537248926894, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0012621921122595368 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.2883872431662452, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004673161214630172 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.08927770465065916, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0016929550946172228 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.058015541222877484, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0013118024160571136 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.2900074000424914, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0046821199593389245 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.09008895599436548, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0017491206522219078 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed1/evaluation/generation/slim.1b121b21bc4seed1_GEM-web_nlg_en_PALM_prompt_2.json b/1b121b21bc4seed1/evaluation/generation/slim.1b121b21bc4seed1_GEM-web_nlg_en_PALM_prompt_2.json new file mode 100644 index 0000000000000000000000000000000000000000..fb5810f559a61ea12efc80a3b17c061346684a12 --- /dev/null +++ b/1b121b21bc4seed1/evaluation/generation/slim.1b121b21bc4seed1_GEM-web_nlg_en_PALM_prompt_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.31791276568975185, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.02727147856829631 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.05962717338634471, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.00126061681638203 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.30756287355829814, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.004889305792734938 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.09336715846217024, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0016996772402870365 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.02670280090842877, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007604338404443195 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.14249676402659822, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0032896138546168476 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.04191645296449831, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0010709241966443265 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.05627058448383118, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0011470016078651416 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.2896458162973523, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0044554794302764 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.08815984465580837, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0015470326777333359 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.05706756866828331, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0012020871707703095 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.292251335959323, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004510651275741409 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.08926200923694406, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.001613762141288785 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed1/evaluation/generation/slim.1b121b21bc4seed1_GEM-web_nlg_en_PALM_prompt_3.json b/1b121b21bc4seed1/evaluation/generation/slim.1b121b21bc4seed1_GEM-web_nlg_en_PALM_prompt_3.json new file mode 100644 index 0000000000000000000000000000000000000000..ffca4a3d3caa57fbf9bfdfe78cf89a4af897c5ea --- /dev/null +++ b/1b121b21bc4seed1/evaluation/generation/slim.1b121b21bc4seed1_GEM-web_nlg_en_PALM_prompt_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.3212440432130126, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.02833396914504117 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.06018320328990788, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0012792421021156602 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.31701882107369783, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.004918042604954739 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.09437325152413317, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0016293117647949373 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.02718506309171944, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.000834511570552857 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.14788498862069166, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0033325099175022747 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.042391214062896254, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0010316080252432995 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.05656198333950361, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0011649029158652883 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.2959773638751678, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004411378256218955 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.08870171226199733, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0014934510170629485 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.05732291421825896, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0012233313963698896 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.3008574516119203, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004550770798562808 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.0897987691484568, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0015399085797828443 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed1/evaluation/generation/slim.1b121b21bc4seed1_GEM-web_nlg_en_PALM_prompt_4.json b/1b121b21bc4seed1/evaluation/generation/slim.1b121b21bc4seed1_GEM-web_nlg_en_PALM_prompt_4.json new file mode 100644 index 0000000000000000000000000000000000000000..ab5c3b32713a9aeb443424605ff2cd3c4a547b9a --- /dev/null +++ b/1b121b21bc4seed1/evaluation/generation/slim.1b121b21bc4seed1_GEM-web_nlg_en_PALM_prompt_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.34701320585063394, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.012982772867681795 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.06139220025240579, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.001204641896215659 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.32370589082989293, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.004818041311873955 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.09652792542278772, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0015764734075382092 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.027393636493786414, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007666521742975135 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.15165230865373422, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003290995473977093 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.043124737274736084, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0010143599611912326 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.057858738343212236, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0011371996173128948 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.3014171252596505, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004324422192213472 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.09083921184905662, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0014744271896824609 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.05856942284861244, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0011580171724704853 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.30659074236282113, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004443465919036145 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.09197412784787223, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0015015595131035856 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed1/evaluation/generation/slim.1b121b21bc4seed1_GEM-web_nlg_en_PALM_prompt_5.json b/1b121b21bc4seed1/evaluation/generation/slim.1b121b21bc4seed1_GEM-web_nlg_en_PALM_prompt_5.json new file mode 100644 index 0000000000000000000000000000000000000000..f8440facbaff6ce9797caa2d6ae1545bb9496b3a --- /dev/null +++ b/1b121b21bc4seed1/evaluation/generation/slim.1b121b21bc4seed1_GEM-web_nlg_en_PALM_prompt_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.3826134137609412, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.027260987836796497 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.06210934649298242, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0011637172836219596 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.32987573012277627, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0048175275958975364 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.09769981149870674, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0015568330004171944 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.027334516755102147, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0006792346244010215 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.1540494964221242, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0033061515191188284 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.04331193468813116, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0009723654636517451 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.058131690562405976, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.001071674347816923 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.30470149207947667, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004224186135139794 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.09131104015906616, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0014304797258199975 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.05908274659378142, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0011102880375707994 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.3110966005686351, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004419284614315986 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.09280326127954946, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0014767682135790052 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed1/evaluation/generation/slim.1b121b21bc4seed1_GEM-wiki_lingua_en_tldr_en_0.json b/1b121b21bc4seed1/evaluation/generation/slim.1b121b21bc4seed1_GEM-wiki_lingua_en_tldr_en_0.json new file mode 100644 index 0000000000000000000000000000000000000000..abce41e174b892225a59f7d9184e279168882f29 --- /dev/null +++ b/1b121b21bc4seed1/evaluation/generation/slim.1b121b21bc4seed1_GEM-wiki_lingua_en_tldr_en_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.1444356353252771, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0018890228924276567 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.24333387644429813, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0026067622578618776 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.16854478548066482, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0018569277613818772 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.029280987606291494, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007237627275927142 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.05112009572683697, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.001337818306117227 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.034308638506432475, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0008125402811211317 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.11294853294767912, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0013180107899456023 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.19771034044326136, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.002117097962875754 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.13358205180049998, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0013364507319559807 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.13255355115964793, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0017152326851252678 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.2246765687186434, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.002420653997148166 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.1549132489748441, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0016876295948321293 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 1.4836403082580132, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.04275891251756906 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed1/evaluation/generation/slim.1b121b21bc4seed1_GEM-wiki_lingua_en_tldr_en_1.json b/1b121b21bc4seed1/evaluation/generation/slim.1b121b21bc4seed1_GEM-wiki_lingua_en_tldr_en_1.json new file mode 100644 index 0000000000000000000000000000000000000000..0b37908ed67fdafc911fbbe6a83a9297b5aa0e80 --- /dev/null +++ b/1b121b21bc4seed1/evaluation/generation/slim.1b121b21bc4seed1_GEM-wiki_lingua_en_tldr_en_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.14337611363324493, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0017975787265801645 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.2401884909277128, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.002577850850716675 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.16619267944887964, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.001744164720654144 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.024778664535770947, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007555235233701629 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.04385427041760851, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0013655854605521512 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.028880049821475656, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0007891070933473794 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.10397637743893304, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.001235246358495789 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.18006724988321413, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0019906559738365613 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.12166495381666467, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0011944014882187845 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.13419081390261864, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0016722655575097506 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.22568787667911147, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.002430850770097226 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.15572261717667488, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0016216939170534584 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 1.368798582263273, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.03762251064773447 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed1/evaluation/generation/slim.1b121b21bc4seed1_GEM-wiki_lingua_en_tldr_en_2.json b/1b121b21bc4seed1/evaluation/generation/slim.1b121b21bc4seed1_GEM-wiki_lingua_en_tldr_en_2.json new file mode 100644 index 0000000000000000000000000000000000000000..ca5f96434300f139eae049e589020c6c7a0382b7 --- /dev/null +++ b/1b121b21bc4seed1/evaluation/generation/slim.1b121b21bc4seed1_GEM-wiki_lingua_en_tldr_en_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.15063044447280027, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.001940763130936743 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.23931115978829579, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0024971943832608266 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.17019067213369107, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0017690889374743603 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.029664097877505877, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0009118238978394307 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.04760945326052988, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.001306711433850517 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.033005228021297704, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0008241949468737384 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.11542835667429227, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0014439177169422246 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.18791535392357211, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.001981689065390633 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.131223027742424, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0012757407637194174 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.14098071498465764, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.001813064708734854 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.22467978591395918, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0023443476592751983 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.15936229418185377, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0016407771888788867 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 1.5622860462600348, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.043740854824911794 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed1/evaluation/generation/slim.1b121b21bc4seed1_GEM-wiki_lingua_en_tldr_en_3.json b/1b121b21bc4seed1/evaluation/generation/slim.1b121b21bc4seed1_GEM-wiki_lingua_en_tldr_en_3.json new file mode 100644 index 0000000000000000000000000000000000000000..3ab1ccd3fe5f800103d58f6c164d8fe78649312d --- /dev/null +++ b/1b121b21bc4seed1/evaluation/generation/slim.1b121b21bc4seed1_GEM-wiki_lingua_en_tldr_en_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.13853097159476044, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0024033845722523724 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.2022241539975303, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.002895744315329479 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.1459775119747986, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.002013820231047812 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.027922753485106568, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0010069321667728792 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.041810329656802245, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.00129627924231701 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.02907493824937833, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0008064371846682719 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.10946213334283154, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0019316172770680437 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.1624038367425624, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0023444744969795006 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.11526184202559941, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0015132431316080114 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.1294243469444916, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0022694744228463435 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.18910016521383136, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0027080908132011243 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.1361503335550405, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.001865935511568599 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 1.5234316086072492, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.04994760816269213 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed1/evaluation/generation/slim.1b121b21bc4seed1_GEM-wiki_lingua_en_tldr_en_4.json b/1b121b21bc4seed1/evaluation/generation/slim.1b121b21bc4seed1_GEM-wiki_lingua_en_tldr_en_4.json new file mode 100644 index 0000000000000000000000000000000000000000..dccc9cce49c1cc491529dfd0b6220ee1d7b289f4 --- /dev/null +++ b/1b121b21bc4seed1/evaluation/generation/slim.1b121b21bc4seed1_GEM-wiki_lingua_en_tldr_en_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.048283116115591836, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0018762804337576465 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.07012389259959088, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0024827186502375275 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.04937920113316496, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0017006423976957319 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.009647802697589025, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0006103768053178551 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.015261115214929618, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0009960688572823394 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.010104805168030258, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0005574344481643184 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.039482927106928814, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0015510440139044537 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.05812150365824274, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.00207507825756795 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.04024639157961486, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0013631991023636098 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.04495702046511921, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0017562417792707258 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.06533375820468378, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0023195859576008596 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.045827471133389246, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.001572714794925252 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 0.41252863907826776, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.030373767513404697 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed1/evaluation/generation/slim.1b121b21bc4seed1_GEM-wiki_lingua_en_tldr_en_5.json b/1b121b21bc4seed1/evaluation/generation/slim.1b121b21bc4seed1_GEM-wiki_lingua_en_tldr_en_5.json new file mode 100644 index 0000000000000000000000000000000000000000..ef95e9ffc2e41a2516477ee0f0edc043cc5c0c2b --- /dev/null +++ b/1b121b21bc4seed1/evaluation/generation/slim.1b121b21bc4seed1_GEM-wiki_lingua_en_tldr_en_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.008053948401330599, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0008246264662235712 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.011572381851776472, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0011296167548172531 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.008092466035741461, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0007725180183102787 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.0016487162145299862, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.00028855076065369416 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.002359034970945986, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.00033523534751396603 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.0016583152317218213, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.00024030776163960353 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.006581900525062106, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0006767336687555497 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.009604072556401588, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0009440395007256133 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.006591147101382126, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0006203194340556792 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.007446672471389, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0007645726188902775 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.01074764632172318, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0010438920929096284 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.00747305417348784, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.000709782509687814 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 1.1512232954144342e-06, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 2.094932653320538e-06 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed1/evaluation/generation/slim.1b121b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_0.json b/1b121b21bc4seed1/evaluation/generation/slim.1b121b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..986cd4ee08a5fa30da59fe9be4354b65924a8c5e --- /dev/null +++ b/1b121b21bc4seed1/evaluation/generation/slim.1b121b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 0.7454534998692752, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.07804428323713496 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.06474609956563113, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.002808015303613375 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.0348307362954131, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0014091894165256253 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.03918099607350703, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.001448534494550284 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.016683043975980968, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0014447318755830502 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.007670856047129852, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0005580500848436268 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.008523314750914139, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.00063055748185768 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.05551189449248439, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.00238259584939437 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.03040510241026872, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0012245380288356473 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.033916243277006014, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.001231432823341605 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.054968825384225664, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0023305151110030124 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.02911562853755617, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0011623178626526266 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.033158173617653046, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0011976728573487477 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed1/evaluation/generation/slim.1b121b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_1.json b/1b121b21bc4seed1/evaluation/generation/slim.1b121b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_1.json new file mode 100644 index 0000000000000000000000000000000000000000..7ed7e597fbaaa64d95435f5407f75d505effe3d1 --- /dev/null +++ b/1b121b21bc4seed1/evaluation/generation/slim.1b121b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 5.487694889793941, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.07555119011558427 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.3097058053229197, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.002851087946324211 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.43110365850951743, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.002732778963977049 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.3321953827037549, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0020364301991294543 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.12287476036716052, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0016877708444218635 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.17280953287169348, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0019134667041499913 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.13126151027829455, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.001411164906927139 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.22519107207919958, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.002044768338085085 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.32069030400568344, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0022416724958190157 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.24346830553368265, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0014712983587429052 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.25598458046409817, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.002501331832178447 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.35721132057108596, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002561727405040063 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.2746466676619327, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0018777824275120166 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed1/evaluation/generation/slim.1b121b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_2.json b/1b121b21bc4seed1/evaluation/generation/slim.1b121b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_2.json new file mode 100644 index 0000000000000000000000000000000000000000..d1fc372a55d8d878785f3a7ecd773e98c4ba1833 --- /dev/null +++ b/1b121b21bc4seed1/evaluation/generation/slim.1b121b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 6.079188977413186, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.09602875924306557 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.3181407194694957, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0029777295615160512 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4561708867688496, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0026452494137559723 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.346570361859306, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.002052145530841731 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.13642028395369205, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0018950492351855646 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.19647624995791846, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0019636015048637256 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.14693316116112215, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0014445847251510187 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.2315672124269367, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.002127274716028904 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3415431295705076, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0022584378328241905 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.25482744735128565, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0014755904280259592 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.2655109833740872, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.002636322289847473 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.38142593418332454, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002536630793778901 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.2890174556326334, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0018995638277943165 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed1/evaluation/generation/slim.1b121b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_3.json b/1b121b21bc4seed1/evaluation/generation/slim.1b121b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_3.json new file mode 100644 index 0000000000000000000000000000000000000000..122e2052ac117b875d399deb697402cd815ee5c5 --- /dev/null +++ b/1b121b21bc4seed1/evaluation/generation/slim.1b121b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 5.439720663780092, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.09057671754019295 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.33806886805387837, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0031451949821916397 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4597540434384101, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0025911053727046204 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.35966978129457794, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0020809245391192944 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.15002040777811748, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0019728388177885454 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.2046175785902067, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.001988761577155802 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.15787398183922485, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.00151813234143548 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.24363492051808863, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0021801249774331755 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3434646349475326, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.00230667877920879 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.26303596646553673, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.001522516609384217 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.2803542384188989, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.002777229104092061 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3816738562894357, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0025233042461889513 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.2981457337030485, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.001964234489421683 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed1/evaluation/generation/slim.1b121b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_4.json b/1b121b21bc4seed1/evaluation/generation/slim.1b121b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_4.json new file mode 100644 index 0000000000000000000000000000000000000000..6a5574bce9a7f76b287f6f1db48a11e1d102d422 --- /dev/null +++ b/1b121b21bc4seed1/evaluation/generation/slim.1b121b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 3.9189279109719335, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.08586279820080885 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.39213707891049004, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.003422529928577996 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.44238533983355405, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0025751632202055024 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.3836182432795783, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0022054074783422308 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.17932569557247965, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0021875288020798776 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.2014446351152472, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.001986701156425044 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.17345256590048624, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.001662967964824317 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.2822423599102126, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.002501678088025689 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.32790464597969743, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0022994271661774903 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.27924589416548823, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0017055264106925416 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.3236183940771683, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0030448679972683726 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3650546853387208, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002486300924606491 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.31650257132624704, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.002105427772389244 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed1/evaluation/generation/slim.1b121b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_5.json b/1b121b21bc4seed1/evaluation/generation/slim.1b121b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_5.json new file mode 100644 index 0000000000000000000000000000000000000000..3721b9be4b87081612825206eecd5b1401ae8efd --- /dev/null +++ b/1b121b21bc4seed1/evaluation/generation/slim.1b121b21bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 3.0686372723608897, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.06784266491877249 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.4502554374503682, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0033630982834692595 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.42945542013401933, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.002595990607765447 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.4095857053929965, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0021530995714477558 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.20886191169135895, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0023179990401586887 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.1967893746603374, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.001931221479807446 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.18712397033462674, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0017078080439781192 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.32145296922919064, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0025789465971034213 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3125724382034645, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.002290959462627688 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.29430723400568193, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.001762954764782701 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.36887628081177687, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.00302325518602794 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3523561197227813, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002466960449053646 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.335707785812935, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0020851385129732505 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed1/evaluation/generation/slim.1b121b21bc4seed1_gem_xsum_article_DOC_summary_0.json b/1b121b21bc4seed1/evaluation/generation/slim.1b121b21bc4seed1_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..096689c3c52c6545d2063696dd3680123595025d --- /dev/null +++ b/1b121b21bc4seed1/evaluation/generation/slim.1b121b21bc4seed1_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.13656588620899038, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.00174226154738388 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.3323235396298205, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.003846536397189559 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.19123744824446468, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0022992268247988583 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.025701014397443208, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0008822864860028765 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.06451842393614433, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0022307575351008177 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.0362962242227074, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0012357989639325655 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.10175956050352102, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0012156226058548923 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.24958177981302834, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0028231998096754063 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.14272621341641745, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0016087589844111059 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.1074311808382226, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0014050024971339861 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.2636816826721476, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0032819789427964595 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.15074429962396632, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0018801101946759444 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.3841560907125259, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.07797827326949171 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed1/evaluation/generation/slim.1b121b21bc4seed1_gem_xsum_article_DOC_summary_1.json b/1b121b21bc4seed1/evaluation/generation/slim.1b121b21bc4seed1_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..6ed203aa91d033066beb65ee263b915440afcc38 --- /dev/null +++ b/1b121b21bc4seed1/evaluation/generation/slim.1b121b21bc4seed1_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.10551189065335231, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0015632545047201442 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.26396369315037715, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.0036356422465613878 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.1490109968360671, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0021151321607124005 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.015258372576455077, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0007194850115847547 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.0401042986262725, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0019569862879314013 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.021870860381131174, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0010335421346335594 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.08322301164562862, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0011487703143784498 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.20979036419712682, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0028033758287091875 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.11776037181510428, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0015663569819055773 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.08413103520980872, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.001254290848777802 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.21222983148038477, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.00304896385565602 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.11905956031628537, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0017138611513238453 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 0.7666050226687372, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.06474629405034218 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed1/evaluation/generation/slim.1b121b21bc4seed1_gem_xsum_article_DOC_summary_2.json b/1b121b21bc4seed1/evaluation/generation/slim.1b121b21bc4seed1_gem_xsum_article_DOC_summary_2.json new file mode 100644 index 0000000000000000000000000000000000000000..97d48d2180ca3427d6ae215d809b6e441a030d48 --- /dev/null +++ b/1b121b21bc4seed1/evaluation/generation/slim.1b121b21bc4seed1_gem_xsum_article_DOC_summary_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.10715846509597497, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0015697108273323291 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.2695418218368475, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.0036206648240501645 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.15152826480726653, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.002114221677973485 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.01667569031887618, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0007375139406724271 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.043570635275517515, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0019441097483278629 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.023831872627776102, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.001048493003352801 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.08504138318382073, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0011733846471463298 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.21610444539656637, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.002873607280157199 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.12053707825720893, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0015925749869109209 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.0856088008772477, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0012678716431980997 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.21768648734893284, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.003115267847510722 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.12141179293846815, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0017373975644363541 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 0.8345839792934845, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.09663801407092908 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed1/evaluation/generation/slim.1b121b21bc4seed1_gem_xsum_article_DOC_summary_3.json b/1b121b21bc4seed1/evaluation/generation/slim.1b121b21bc4seed1_gem_xsum_article_DOC_summary_3.json new file mode 100644 index 0000000000000000000000000000000000000000..4347a944341c8424f50545cb8d35d10e7a2fcbc4 --- /dev/null +++ b/1b121b21bc4seed1/evaluation/generation/slim.1b121b21bc4seed1_gem_xsum_article_DOC_summary_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.10606297790246366, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0017854168680511101 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.2559365393746863, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.003942828057917467 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.14641419405475198, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0022626874492042907 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.016403947053914306, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0007741120118238733 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.04155268993757446, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.002004912080845838 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.023068148270822337, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.001082001329317035 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.08438433169380888, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0013959138179342146 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.20443934586419923, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.003127827147724924 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.11651320027532101, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0017495857212361317 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.08473700150035146, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0014635025254577177 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.20585072949190508, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.003317649942197773 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.11708695716505582, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0018525946257683778 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 0.9311539798670635, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.09107540142081379 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed1/evaluation/generation/slim.1b121b21bc4seed1_gem_xsum_article_DOC_summary_4.json b/1b121b21bc4seed1/evaluation/generation/slim.1b121b21bc4seed1_gem_xsum_article_DOC_summary_4.json new file mode 100644 index 0000000000000000000000000000000000000000..57a6a9f93caf14935ba860f3836c9856458f4819 --- /dev/null +++ b/1b121b21bc4seed1/evaluation/generation/slim.1b121b21bc4seed1_gem_xsum_article_DOC_summary_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.033538556464056984, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.002282970207590659 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.061278166608827844, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.0035032648267361863 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.03857476484604358, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.002181373104120625 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.00356863909695226, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.00043019877312427664 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.007827354388277672, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.000890140246104386 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.004640907524463805, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.000536562366213917 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.026997141398160576, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.001907201107733291 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.049289096496901386, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0027778936304874483 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.03084447504069215, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.001708948915334388 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.027395316222004706, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0019605932238404397 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.04960704068168692, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.002857971818835903 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.03116504304791766, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0017650576678384076 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 0.41043347346219244, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.1486020805997744 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed1/evaluation/generation/slim.1b121b21bc4seed1_gem_xsum_article_DOC_summary_5.json b/1b121b21bc4seed1/evaluation/generation/slim.1b121b21bc4seed1_gem_xsum_article_DOC_summary_5.json new file mode 100644 index 0000000000000000000000000000000000000000..6f7430c9861e0d368cccdd80c8e5771095375e9e --- /dev/null +++ b/1b121b21bc4seed1/evaluation/generation/slim.1b121b21bc4seed1_gem_xsum_article_DOC_summary_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.0021237847249880666, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0005810244101355184 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.00177754327837735, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.00048757744409275904 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.0018825860372170817, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0005105425641834596 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.00019654088050314464, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.00015261564209740738 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.00019511149228130362, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.00016439589503089688 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.00019318274102930717, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.00015698812424376165 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.0017497614736063241, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.00048095662458468534 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.001513011919166749, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0004307689764831507 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.0015759792816185546, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.00043710297005663255 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.0018510098059867322, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.000507889962370857 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.0016014978567092907, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0004541344456295751 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.0016704094537401807, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.000463071140217582 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.7812749842983558e-39, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 6.173625004905157e-36 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed1/evaluation/rankeval/1b121b21bc4seed1_0.csv b/1b121b21bc4seed1/evaluation/rankeval/1b121b21bc4seed1_0.csv new file mode 100644 index 0000000000000000000000000000000000000000..be43bc7a2a96f86a5e06c9622eac2dfd8d0579f7 --- /dev/null +++ b/1b121b21bc4seed1/evaluation/rankeval/1b121b21bc4seed1_0.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.331,0.014888272588203933,0 +anli_r2,acc,0.337,0.014955087918653602,0 +anli_r3,acc,0.3375,0.013655897185463657,0 +arc_challenge,acc,0.20733788395904437,0.011846905782971361,0 +arc_challenge,acc_norm,0.24914675767918087,0.012639407111926439,0 +arc_easy,acc,0.5046296296296297,0.01025934370588973,0 +arc_easy,acc_norm,0.44276094276094274,0.010192333348394462,0 +boolq,acc,0.5681957186544343,0.008663332644225124,1 +cb,acc,0.44642857142857145,0.06703189227942398,1 +cb,f1,0.24357864357864356,,1 +copa,acc,0.7,0.046056618647183814,0 +hellaswag,acc,0.3563035251941844,0.004779276329704052,0 +hellaswag,acc_norm,0.43547102170882296,0.004948052131344501,0 +piqa,acc,0.6953210010881393,0.010738889044325161,0 +piqa,acc_norm,0.6996735582154516,0.01069522530818314,0 +rte,acc,0.5270758122743683,0.030052303463143706,0 +sciq,acc,0.789,0.01290913032104209,0 +sciq,acc_norm,0.682,0.014734079309311901,0 +storycloze_2016,acc,0.6365579903794762,0.01112284144205971,0 +winogrande,acc,0.5280189423835833,0.014030404213405786,0 diff --git a/1b121b21bc4seed1/evaluation/rankeval/1b121b21bc4seed1_0.json b/1b121b21bc4seed1/evaluation/rankeval/1b121b21bc4seed1_0.json new file mode 100644 index 0000000000000000000000000000000000000000..05acef8205f6fcb46c3d2c8ad045d25eecd56a6a --- /dev/null +++ b/1b121b21bc4seed1/evaluation/rankeval/1b121b21bc4seed1_0.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.331, + "acc_stderr": 0.014888272588203933 + }, + "anli_r2": { + "acc": 0.337, + "acc_stderr": 0.014955087918653602 + }, + "anli_r3": { + "acc": 0.3375, + "acc_stderr": 0.013655897185463657 + }, + "cb": { + "acc": 0.44642857142857145, + "acc_stderr": 0.06703189227942398, + "f1": 0.24357864357864356 + }, + "copa": { + "acc": 0.7, + "acc_stderr": 0.046056618647183814 + }, + "hellaswag": { + "acc": 0.3563035251941844, + "acc_stderr": 0.004779276329704052, + "acc_norm": 0.43547102170882296, + "acc_norm_stderr": 0.004948052131344501 + }, + "rte": { + "acc": 0.5270758122743683, + "acc_stderr": 0.030052303463143706 + }, + "winogrande": { + "acc": 0.5280189423835833, + "acc_stderr": 0.014030404213405786 + }, + "storycloze_2016": { + "acc": 0.6365579903794762, + "acc_stderr": 0.01112284144205971 + }, + "boolq": { + "acc": 0.5681957186544343, + "acc_stderr": 0.008663332644225124 + }, + "arc_easy": { + "acc": 0.5046296296296297, + "acc_stderr": 0.01025934370588973, + "acc_norm": 0.44276094276094274, + "acc_norm_stderr": 0.010192333348394462 + }, + "arc_challenge": { + "acc": 0.20733788395904437, + "acc_stderr": 0.011846905782971361, + "acc_norm": 0.24914675767918087, + "acc_norm_stderr": 0.012639407111926439 + }, + "sciq": { + "acc": 0.789, + "acc_stderr": 0.01290913032104209, + "acc_norm": 0.682, + "acc_norm_stderr": 0.014734079309311901 + }, + "piqa": { + "acc": 0.6953210010881393, + "acc_stderr": 0.010738889044325161, + "acc_norm": 0.6996735582154516, + "acc_norm_stderr": 0.01069522530818314 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed1/evaluation/rankeval/1b121b21bc4seed1_1.csv b/1b121b21bc4seed1/evaluation/rankeval/1b121b21bc4seed1_1.csv new file mode 100644 index 0000000000000000000000000000000000000000..06cf0d741c662f0c9cdcf7d82ac7977e0b351639 --- /dev/null +++ b/1b121b21bc4seed1/evaluation/rankeval/1b121b21bc4seed1_1.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.332,0.01489959724281148,0 +anli_r2,acc,0.351,0.015100563798316402,0 +anli_r3,acc,0.3225,0.013499258621103244,0 +arc_challenge,acc,0.23464163822525597,0.012383873560768673,0 +arc_challenge,acc_norm,0.25853242320819114,0.012794553754288679,0 +arc_easy,acc,0.5113636363636364,0.010257133441117113,0 +arc_easy,acc_norm,0.4617003367003367,0.01022963982061052,0 +boolq,acc,0.5581039755351682,0.008685806399014942,1 +cb,acc,0.5178571428571429,0.06737697508644648,1 +cb,f1,0.35614160133048234,,1 +copa,acc,0.67,0.047258156262526066,0 +hellaswag,acc,0.35530770762796254,0.004776283203468103,0 +hellaswag,acc_norm,0.4366660027882892,0.004949589567678897,0 +piqa,acc,0.691512513601741,0.01077616467803716,0 +piqa,acc_norm,0.6800870511425462,0.010882873582092062,0 +rte,acc,0.5451263537906137,0.029973636495415252,0 +sciq,acc,0.795,0.012772554096113112,0 +sciq,acc_norm,0.763,0.013454070462577957,0 +storycloze_2016,acc,0.6322822020309995,0.011150439885470124,0 +winogrande,acc,0.5351223362273086,0.014017773120881587,0 diff --git a/1b121b21bc4seed1/evaluation/rankeval/1b121b21bc4seed1_1.json b/1b121b21bc4seed1/evaluation/rankeval/1b121b21bc4seed1_1.json new file mode 100644 index 0000000000000000000000000000000000000000..60eceb8c7fc3cb6d94b1e7171c73852fd21decc7 --- /dev/null +++ b/1b121b21bc4seed1/evaluation/rankeval/1b121b21bc4seed1_1.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.332, + "acc_stderr": 0.01489959724281148 + }, + "anli_r2": { + "acc": 0.351, + "acc_stderr": 0.015100563798316402 + }, + "anli_r3": { + "acc": 0.3225, + "acc_stderr": 0.013499258621103244 + }, + "cb": { + "acc": 0.5178571428571429, + "acc_stderr": 0.06737697508644648, + "f1": 0.35614160133048234 + }, + "copa": { + "acc": 0.67, + "acc_stderr": 0.047258156262526066 + }, + "hellaswag": { + "acc": 0.35530770762796254, + "acc_stderr": 0.004776283203468103, + "acc_norm": 0.4366660027882892, + "acc_norm_stderr": 0.004949589567678897 + }, + "rte": { + "acc": 0.5451263537906137, + "acc_stderr": 0.029973636495415252 + }, + "winogrande": { + "acc": 0.5351223362273086, + "acc_stderr": 0.014017773120881587 + }, + "storycloze_2016": { + "acc": 0.6322822020309995, + "acc_stderr": 0.011150439885470124 + }, + "boolq": { + "acc": 0.5581039755351682, + "acc_stderr": 0.008685806399014942 + }, + "arc_easy": { + "acc": 0.5113636363636364, + "acc_stderr": 0.010257133441117113, + "acc_norm": 0.4617003367003367, + "acc_norm_stderr": 0.01022963982061052 + }, + "arc_challenge": { + "acc": 0.23464163822525597, + "acc_stderr": 0.012383873560768673, + "acc_norm": 0.25853242320819114, + "acc_norm_stderr": 0.012794553754288679 + }, + "sciq": { + "acc": 0.795, + "acc_stderr": 0.012772554096113112, + "acc_norm": 0.763, + "acc_norm_stderr": 0.013454070462577957 + }, + "piqa": { + "acc": 0.691512513601741, + "acc_stderr": 0.01077616467803716, + "acc_norm": 0.6800870511425462, + "acc_norm_stderr": 0.010882873582092062 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed1/evaluation/rankeval/1b121b21bc4seed1_2.csv b/1b121b21bc4seed1/evaluation/rankeval/1b121b21bc4seed1_2.csv new file mode 100644 index 0000000000000000000000000000000000000000..7a85e065cf94c01f2e068875a8b4e86993f9de49 --- /dev/null +++ b/1b121b21bc4seed1/evaluation/rankeval/1b121b21bc4seed1_2.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.332,0.014899597242811476,0 +anli_r2,acc,0.347,0.01506047203170662,0 +anli_r3,acc,0.345,0.013728421539454876,0 +arc_challenge,acc,0.2150170648464164,0.01200571763413361,0 +arc_challenge,acc_norm,0.25,0.012653835621466646,0 +arc_easy,acc,0.5202020202020202,0.010251405621305368,0 +arc_easy,acc_norm,0.47853535353535354,0.01025032515945666,0 +boolq,acc,0.5571865443425077,0.008687668766930825,1 +cb,acc,0.4642857142857143,0.06724777654937658,1 +cb,f1,0.2990049751243781,,1 +copa,acc,0.65,0.047937248544110196,0 +hellaswag,acc,0.35172276438956385,0.004765320784902128,0 +hellaswag,acc_norm,0.4303923521210914,0.004941191607317911,0 +piqa,acc,0.6931447225244831,0.010760295070580366,0 +piqa,acc_norm,0.6920565832426551,0.010770892367463676,0 +rte,acc,0.5306859205776173,0.030039730592197812,0 +sciq,acc,0.822,0.01210216767618359,0 +sciq,acc_norm,0.785,0.01299784381903182,0 +storycloze_2016,acc,0.6221272047033671,0.01121221988713706,0 +winogrande,acc,0.5272296764009471,0.0140316316298277,0 diff --git a/1b121b21bc4seed1/evaluation/rankeval/1b121b21bc4seed1_2.json b/1b121b21bc4seed1/evaluation/rankeval/1b121b21bc4seed1_2.json new file mode 100644 index 0000000000000000000000000000000000000000..54a90cf8924939b968b8094298c8cbbf25d59f92 --- /dev/null +++ b/1b121b21bc4seed1/evaluation/rankeval/1b121b21bc4seed1_2.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.332, + "acc_stderr": 0.014899597242811476 + }, + "anli_r2": { + "acc": 0.347, + "acc_stderr": 0.01506047203170662 + }, + "anli_r3": { + "acc": 0.345, + "acc_stderr": 0.013728421539454876 + }, + "cb": { + "acc": 0.4642857142857143, + "acc_stderr": 0.06724777654937658, + "f1": 0.2990049751243781 + }, + "copa": { + "acc": 0.65, + "acc_stderr": 0.047937248544110196 + }, + "hellaswag": { + "acc": 0.35172276438956385, + "acc_stderr": 0.004765320784902128, + "acc_norm": 0.4303923521210914, + "acc_norm_stderr": 0.004941191607317911 + }, + "rte": { + "acc": 0.5306859205776173, + "acc_stderr": 0.030039730592197812 + }, + "winogrande": { + "acc": 0.5272296764009471, + "acc_stderr": 0.0140316316298277 + }, + "storycloze_2016": { + "acc": 0.6221272047033671, + "acc_stderr": 0.01121221988713706 + }, + "boolq": { + "acc": 0.5571865443425077, + "acc_stderr": 0.008687668766930825 + }, + "arc_easy": { + "acc": 0.5202020202020202, + "acc_stderr": 0.010251405621305368, + "acc_norm": 0.47853535353535354, + "acc_norm_stderr": 0.01025032515945666 + }, + "arc_challenge": { + "acc": 0.2150170648464164, + "acc_stderr": 0.01200571763413361, + "acc_norm": 0.25, + "acc_norm_stderr": 0.012653835621466646 + }, + "sciq": { + "acc": 0.822, + "acc_stderr": 0.01210216767618359, + "acc_norm": 0.785, + "acc_norm_stderr": 0.01299784381903182 + }, + "piqa": { + "acc": 0.6931447225244831, + "acc_stderr": 0.010760295070580366, + "acc_norm": 0.6920565832426551, + "acc_norm_stderr": 0.010770892367463676 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed1/evaluation/rankeval/1b121b21bc4seed1_3.csv b/1b121b21bc4seed1/evaluation/rankeval/1b121b21bc4seed1_3.csv new file mode 100644 index 0000000000000000000000000000000000000000..f65ec384550be43779c843e098eb2c3425bbb39b --- /dev/null +++ b/1b121b21bc4seed1/evaluation/rankeval/1b121b21bc4seed1_3.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.337,0.014955087918653591,0 +anli_r2,acc,0.356,0.015149042659306623,0 +anli_r3,acc,0.335,0.013630871843821479,0 +arc_challenge,acc,0.2158703071672355,0.01202297536003067,0 +arc_challenge,acc_norm,0.25,0.012653835621466646,0 +arc_easy,acc,0.5117845117845118,0.010256933475911013,0 +arc_easy,acc_norm,0.47264309764309764,0.010244415164390536,0 +boolq,acc,0.5571865443425077,0.008687668766930817,1 +cb,acc,0.5178571428571429,0.06737697508644648,1 +cb,f1,0.3270735524256651,,1 +copa,acc,0.68,0.04688261722621504,0 +hellaswag,acc,0.3527185819557857,0.004768395354146806,0 +hellaswag,acc_norm,0.434973112925712,0.004947402907996247,0 +piqa,acc,0.7072905331882481,0.010616044462393092,0 +piqa,acc_norm,0.6855277475516867,0.010833009065106565,0 +rte,acc,0.5306859205776173,0.03003973059219781,0 +sciq,acc,0.829,0.011912216456264606,0 +sciq,acc_norm,0.797,0.01272607374459827,0 +storycloze_2016,acc,0.6280064136825227,0.011177095517223673,0 +winogrande,acc,0.526440410418311,0.014032823874407224,0 diff --git a/1b121b21bc4seed1/evaluation/rankeval/1b121b21bc4seed1_3.json b/1b121b21bc4seed1/evaluation/rankeval/1b121b21bc4seed1_3.json new file mode 100644 index 0000000000000000000000000000000000000000..42dd904468738fb6afe156fcfec4444a840f8c12 --- /dev/null +++ b/1b121b21bc4seed1/evaluation/rankeval/1b121b21bc4seed1_3.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.337, + "acc_stderr": 0.014955087918653591 + }, + "anli_r2": { + "acc": 0.356, + "acc_stderr": 0.015149042659306623 + }, + "anli_r3": { + "acc": 0.335, + "acc_stderr": 0.013630871843821479 + }, + "cb": { + "acc": 0.5178571428571429, + "acc_stderr": 0.06737697508644648, + "f1": 0.3270735524256651 + }, + "copa": { + "acc": 0.68, + "acc_stderr": 0.04688261722621504 + }, + "hellaswag": { + "acc": 0.3527185819557857, + "acc_stderr": 0.004768395354146806, + "acc_norm": 0.434973112925712, + "acc_norm_stderr": 0.004947402907996247 + }, + "rte": { + "acc": 0.5306859205776173, + "acc_stderr": 0.03003973059219781 + }, + "winogrande": { + "acc": 0.526440410418311, + "acc_stderr": 0.014032823874407224 + }, + "storycloze_2016": { + "acc": 0.6280064136825227, + "acc_stderr": 0.011177095517223673 + }, + "boolq": { + "acc": 0.5571865443425077, + "acc_stderr": 0.008687668766930817 + }, + "arc_easy": { + "acc": 0.5117845117845118, + "acc_stderr": 0.010256933475911013, + "acc_norm": 0.47264309764309764, + "acc_norm_stderr": 0.010244415164390536 + }, + "arc_challenge": { + "acc": 0.2158703071672355, + "acc_stderr": 0.01202297536003067, + "acc_norm": 0.25, + "acc_norm_stderr": 0.012653835621466646 + }, + "sciq": { + "acc": 0.829, + "acc_stderr": 0.011912216456264606, + "acc_norm": 0.797, + "acc_norm_stderr": 0.01272607374459827 + }, + "piqa": { + "acc": 0.7072905331882481, + "acc_stderr": 0.010616044462393092, + "acc_norm": 0.6855277475516867, + "acc_norm_stderr": 0.010833009065106565 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed1/evaluation/rankeval/1b121b21bc4seed1_4.csv b/1b121b21bc4seed1/evaluation/rankeval/1b121b21bc4seed1_4.csv new file mode 100644 index 0000000000000000000000000000000000000000..529e0cf8050944504b467636cd7973fa3c7eeb3d --- /dev/null +++ b/1b121b21bc4seed1/evaluation/rankeval/1b121b21bc4seed1_4.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.342,0.01500870618212173,0 +anli_r2,acc,0.343,0.015019206922356953,0 +anli_r3,acc,0.35333333333333333,0.013804572162314928,0 +arc_challenge,acc,0.21843003412969283,0.012074291605700985,0 +arc_challenge,acc_norm,0.2525597269624573,0.012696728980207704,0 +arc_easy,acc,0.5185185185185185,0.010252744217435635,0 +arc_easy,acc_norm,0.49158249158249157,0.010258329515226445,0 +boolq,acc,0.5584097859327217,0.008685178933161664,1 +cb,acc,0.5535714285714286,0.06703189227942395,1 +cb,f1,0.34722222222222227,,1 +copa,acc,0.67,0.047258156262526066,0 +hellaswag,acc,0.35480979884485164,0.0047747781803451905,0 +hellaswag,acc_norm,0.4326827325234017,0.004944351065545849,0 +piqa,acc,0.6947769314472253,0.01074426704560648,0 +piqa,acc_norm,0.6849836779107725,0.010838072746240652,0 +rte,acc,0.5018050541516246,0.030096267148976626,0 +sciq,acc,0.827,0.011967214137559953,0 +sciq,acc_norm,0.796,0.012749374359024391,0 +storycloze_2016,acc,0.6258685195082844,0.011190071893524303,0 +winogrande,acc,0.5248618784530387,0.01403510288362775,0 diff --git a/1b121b21bc4seed1/evaluation/rankeval/1b121b21bc4seed1_4.json b/1b121b21bc4seed1/evaluation/rankeval/1b121b21bc4seed1_4.json new file mode 100644 index 0000000000000000000000000000000000000000..f7273250f2579136f0c6e4aa0e10d6083171c0bd --- /dev/null +++ b/1b121b21bc4seed1/evaluation/rankeval/1b121b21bc4seed1_4.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.342, + "acc_stderr": 0.01500870618212173 + }, + "anli_r2": { + "acc": 0.343, + "acc_stderr": 0.015019206922356953 + }, + "anli_r3": { + "acc": 0.35333333333333333, + "acc_stderr": 0.013804572162314928 + }, + "cb": { + "acc": 0.5535714285714286, + "acc_stderr": 0.06703189227942395, + "f1": 0.34722222222222227 + }, + "copa": { + "acc": 0.67, + "acc_stderr": 0.047258156262526066 + }, + "hellaswag": { + "acc": 0.35480979884485164, + "acc_stderr": 0.0047747781803451905, + "acc_norm": 0.4326827325234017, + "acc_norm_stderr": 0.004944351065545849 + }, + "rte": { + "acc": 0.5018050541516246, + "acc_stderr": 0.030096267148976626 + }, + "winogrande": { + "acc": 0.5248618784530387, + "acc_stderr": 0.01403510288362775 + }, + "storycloze_2016": { + "acc": 0.6258685195082844, + "acc_stderr": 0.011190071893524303 + }, + "boolq": { + "acc": 0.5584097859327217, + "acc_stderr": 0.008685178933161664 + }, + "arc_easy": { + "acc": 0.5185185185185185, + "acc_stderr": 0.010252744217435635, + "acc_norm": 0.49158249158249157, + "acc_norm_stderr": 0.010258329515226445 + }, + "arc_challenge": { + "acc": 0.21843003412969283, + "acc_stderr": 0.012074291605700985, + "acc_norm": 0.2525597269624573, + "acc_norm_stderr": 0.012696728980207704 + }, + "sciq": { + "acc": 0.827, + "acc_stderr": 0.011967214137559953, + "acc_norm": 0.796, + "acc_norm_stderr": 0.012749374359024391 + }, + "piqa": { + "acc": 0.6947769314472253, + "acc_stderr": 0.01074426704560648, + "acc_norm": 0.6849836779107725, + "acc_norm_stderr": 0.010838072746240652 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed1/evaluation/rankeval/1b121b21bc4seed1_5.csv b/1b121b21bc4seed1/evaluation/rankeval/1b121b21bc4seed1_5.csv new file mode 100644 index 0000000000000000000000000000000000000000..523a858695c1571479ad9d30207cd02cd3710331 --- /dev/null +++ b/1b121b21bc4seed1/evaluation/rankeval/1b121b21bc4seed1_5.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.34,0.014987482264363937,0 +anli_r2,acc,0.34,0.014987482264363937,0 +anli_r3,acc,0.3516666666666667,0.01378971169540479,0 +arc_challenge,acc,0.21331058020477817,0.011970971742326334,0 +arc_challenge,acc_norm,0.25170648464163825,0.012682496334042963,0 +arc_easy,acc,0.5122053872053872,0.01025672623512901,0 +arc_easy,acc_norm,0.4831649831649832,0.010253966261288898,0 +boolq,acc,0.5593272171253822,0.008683276495829012,1 +cb,acc,0.5535714285714286,0.06703189227942395,1 +cb,f1,0.35469755469755465,,1 +copa,acc,0.71,0.045604802157206845,0 +hellaswag,acc,0.35381398127862973,0.004771751187407021,0 +hellaswag,acc_norm,0.43815972913762197,0.004951470301995878,0 +piqa,acc,0.6931447225244831,0.010760295070580371,0 +piqa,acc_norm,0.6806311207834603,0.010877964076613744,0 +rte,acc,0.5415162454873647,0.029992535385373314,0 +sciq,acc,0.829,0.011912216456264604,0 +sciq,acc_norm,0.803,0.012583693787968132,0 +storycloze_2016,acc,0.6290753607696419,0.01117051962469349,0 +winogrande,acc,0.5209155485398579,0.014040185494212945,0 diff --git a/1b121b21bc4seed1/evaluation/rankeval/1b121b21bc4seed1_5.json b/1b121b21bc4seed1/evaluation/rankeval/1b121b21bc4seed1_5.json new file mode 100644 index 0000000000000000000000000000000000000000..db677ea71469daf1b2a335ad0e946479ccf1a257 --- /dev/null +++ b/1b121b21bc4seed1/evaluation/rankeval/1b121b21bc4seed1_5.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.34, + "acc_stderr": 0.014987482264363937 + }, + "anli_r2": { + "acc": 0.34, + "acc_stderr": 0.014987482264363937 + }, + "anli_r3": { + "acc": 0.3516666666666667, + "acc_stderr": 0.01378971169540479 + }, + "cb": { + "acc": 0.5535714285714286, + "acc_stderr": 0.06703189227942395, + "f1": 0.35469755469755465 + }, + "copa": { + "acc": 0.71, + "acc_stderr": 0.045604802157206845 + }, + "hellaswag": { + "acc": 0.35381398127862973, + "acc_stderr": 0.004771751187407021, + "acc_norm": 0.43815972913762197, + "acc_norm_stderr": 0.004951470301995878 + }, + "rte": { + "acc": 0.5415162454873647, + "acc_stderr": 0.029992535385373314 + }, + "winogrande": { + "acc": 0.5209155485398579, + "acc_stderr": 0.014040185494212945 + }, + "storycloze_2016": { + "acc": 0.6290753607696419, + "acc_stderr": 0.01117051962469349 + }, + "boolq": { + "acc": 0.5593272171253822, + "acc_stderr": 0.008683276495829012 + }, + "arc_easy": { + "acc": 0.5122053872053872, + "acc_stderr": 0.01025672623512901, + "acc_norm": 0.4831649831649832, + "acc_norm_stderr": 0.010253966261288898 + }, + "arc_challenge": { + "acc": 0.21331058020477817, + "acc_stderr": 0.011970971742326334, + "acc_norm": 0.25170648464163825, + "acc_norm_stderr": 0.012682496334042963 + }, + "sciq": { + "acc": 0.829, + "acc_stderr": 0.011912216456264604, + "acc_norm": 0.803, + "acc_norm_stderr": 0.012583693787968132 + }, + "piqa": { + "acc": 0.6931447225244831, + "acc_stderr": 0.010760295070580371, + "acc_norm": 0.6806311207834603, + "acc_norm_stderr": 0.010877964076613744 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..12d4fc43a38b5d782b66361b8d8471093b0f65aa --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68bb4cc1d28ed6b9fcebc5341b11c16d8d02f1d27e0b0974adc4f7c0393d239e +size 51395415 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..933f14e45bb003cf2c832665650ce12804ee2149 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15af8c0182970a7fed9f357dd4d42962ec9f84bef3ea5235345ee703b5fe96a0 +size 51395373 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..666a0a8b632da0576728b8ce93b57d95abdc9aea --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1cba3385be5bc89ca7597c839c432ea9bb3b9565e3a321b266834205c67de480 +size 51395437 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f24a4df49a9bd3495f0e0ad43367805e774c37bf --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ceca10b2ca5434eeb71d08414e35e959d73b48af32a3985f248213c4f70e6fc7 +size 51395501 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f941357d6d225eb0064cc85951a8a4c615efad64 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ae58af3626c2780bca8e3156a29dfea0a633ea66b31e65f180e61cdbeff8241 +size 51395565 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d80b30b5c2d2bca14b0384e549529064d944e26 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e8234536b0c8295ad629838b8fe8120a231636a5b1b2609ac651c9020315a6d +size 51395373 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..993288c3d802e7babbf82450f990ce8dc737df22 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83e815ea650d86f66caf318aff67d13c60b0fdfb6f92e130ce581164f39f31fa +size 51395373 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..198f55dc83bd6b0bfd14ceccb4632132f181938b --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:733803e6ff21bbbbf76f56f0f0d8eab54d15fcad3bfb65a026b7e785ae561a19 +size 51395437 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ab1f3f100cf4e2f2840a243650168e74c2d4ed1 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:692d06b268bc7921295e4de437ab657e0678626524caea673e12510916f3daea +size 51395501 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..05761b6154732d5510ca1529c4bfb64eff061b00 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15c67a6f5346ea6001fb22776e8fe9cb094925714453f3de78e60f49fb5aa27a +size 51395437 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9d12879c93c5c5a828a09cdb1b637f380d998f06 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97cff611d9bf4be5b5262fdf31529d7ea473bef37a6ef6ce36d12fd8122a1c42 +size 51395501 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..146b65ef00febf1c2f08d97d50f07d18724427f0 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:914c5cb8071a821882bb1c2645289e04156f8ebe1e306e34aa3a72a5b4c3ff43 +size 51395426 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1103bed0244f1084602d08f97df5f1a21eacaf52 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c49570ed9f2beb1df8dc8002d76102a2640de8b92644de1999fbe3dab20243b4 +size 51395373 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3035feeb7827a45e446652216716e894a000eee7 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07006150dad05a4ca9ffea4fc473367554069a4edb7dd060dff4638d8618bee4 +size 51395437 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6035dc72ee00abb8920558c83cb2912e47280b38 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62d6de1817d27f84f88f96cfd6108026c38cefd3d736f3f1a5455a94bc2e07b7 +size 51395501 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..17ec132825a26fadac372a3358d6511de00471fb --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a093d742c5765d3b18790dcb91d960213862e2d8f33947c59fa3f7f6138bbba1 +size 51395501 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9611c1caab3dcaf53b488a8e59b43470ce3f611b --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cec6c9349dae436fd950b358220072c8f1fce46deb269cd1c044791fecb83ff1 +size 51395437 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..67b07d67e466c8c490d589140d8f5d015ab8567f --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a851b7349d95753e8b0f603f826e534273b760a28411ac7cfc7489a59778e17d +size 51395437 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3bc987c724e8e54fed5cb574fa4d21c6da801527 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:acfae6a728dba5685fbfb4927d27856fca55f0a3759334cee803f6fc103fe3ab +size 51395373 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..16f5f7f7959cd39981b24138d9b82677fab92bd0 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8ed995cfa360821e943b008f8da7f8227475f0bc30d117b2eb6976515d7e12b +size 51395373 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce1284d4348dc103ef3c3688912618e7aed424db --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f723b2aa296a4a33879d403a3d9ba3bbc2d0555bd61d30eb54df0fa41f2ef41a +size 51395437 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c528e0e915ca09fe123f380233dbd1ad9b254f9e --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ff0c0da4935d29329dc9511d1928f806f07d325b4eade8358f40b558ec17c2e +size 51395373 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..87e122c72c9f33c06265b802bd6912a947b8689a --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22771c7805501ecff970bfe7ae3742c19529690b1b7edd04d67ff3b9e6172cc9 +size 51395490 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b814b53a2e57aa5c7baeca8717a5786a468aa3db --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69548590155f4843a2c89da426df404e058161a8cd7942e14841d0dc3537fe59 +size 51395437 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..19794df64a2cbcdfc8c91bcaee90c03245b3841f --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a926e7b86794ebf278753a66e0601b1e2488e7cdf2632c729dbdfc77df29ee9 +size 51395565 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..38edf67ff70984897672d3cf9ab2a4ac4e4a440b --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f85e635b16f47404ecd41fa922cec05bb0fb970c93a69279e4c82f09dd84fb95 +size 51395437 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..033cebf7e2387caad6d3141518614e0bc8e87dfa --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61ba7be3c8cc482e1b6ec13415e67d0adbd48b509b44a91efa735967bffa41ed +size 51395437 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e8c3f0de7b9237e946f35f5b64f136df2fdf002b --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ce7ad769c004572f7ccffc760a643124f59a05d320e34ae0b14c26458792ebb +size 51395373 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e2b9c19ea0f4a22ddc768c4f8f9d7ec7fd949813 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2c20734013ae4d24948098e975e74c5e9902b506de9e6fb4437cb79c35ff894 +size 51395373 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c81d3d33e260a134864f70304c9e67bce15f36df --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0db8b535d04069156e9122d3638be2bfc9528194285bbfd3fc92ed2161b1b6e4 +size 51395565 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3355adb73e40414a67546bfb5564f668f89b4619 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4c2128b43cc7c4f992eb1daf97311aee7e796fa39708fc5b714e1656013857a +size 51395437 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_128_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_128_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe2033da21804273bea534e8b3a94c9cb43914f5 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_128_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eaed43f8e68022894611d10aeb496a672833ffc040de8e8c2166ee6943504bf3 +size 51395437 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_129_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_129_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..197402aa7709b1e1c5822ef125f895b2b43ff920 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_129_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:846fad34d70eaefbe7e177bdd68fa813ac1bdf5111c4712a8eca380d2908756e +size 51395373 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..83decd859f10664d16cff07d07d74e1391216386 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:125dd2e65f4a52356c7e265c4f44db9bd2f5b6d72dadc8b87fb3149b52012f72 +size 51395426 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_130_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_130_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc42ead0921fb21a211b5d65b8f0a22a0a58bfc3 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_130_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d867a7190e3e28a1b952ec53848c2f3cd5fbbc4e8d57beae133baa8fdb520dc6 +size 51395437 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_131_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_131_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..30e8c30372fc3f4dabd8c6e2a30129c22fe13062 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_131_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1288f61407f86847a17a439e91576969d3a372626f92631a3a15042b441348fc +size 51395565 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_132_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_132_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b04e193d84eead48de9e9fb7e27ef451127afc62 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_132_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:015493196bcfe4504455cfe29d180c1c82569a654051595e66561e9fefa326a8 +size 51395437 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_133_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_133_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..adf5a542789cd502c1efbf4e5198a31fe8de7e3b --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_133_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ef754f280f3eef2f370b9cd007666feb9d715e7fc9fc6f616bf10404534a4ab +size 51395437 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_134_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_134_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d19ec223b9f1cf9b9db576fe68006b9d8c44e639 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_134_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5eb8aebafaccc0871fba5950204d9561c1432f2aa07274f4084003186c18bc6 +size 51395437 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_135_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_135_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2005c5eb50e8b08d1615a9803926a2b6ce336333 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_135_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:485f33aa461dc24fb2972bc1f152403113c7cb89a8424397d5aa19fb63363320 +size 51395373 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_136_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_136_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..59cd5d40ab1b26fdb338d2dc3b051a3c28301a03 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_136_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7354401bfd7ebbbeee97f5d88179770f3868e3591857c7deb6bcabfe8dff49b4 +size 51395373 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_137_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_137_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bda9cbbf5b14343de2d10786029c6a9961f4961f --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_137_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfc443cdf060b9ad2fed03531423c7d78fa3b6aaeea5cc2dca88565bdc7640ab +size 51395501 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_138_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_138_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c21f465fd2de6e3b1dcc47978ffccadcf968aaf7 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_138_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee58ce9422459b7771257b6ce43659f10d2527112bcf085766c152eb08744df0 +size 51395437 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_139_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_139_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c1249455916ead3cc474c14060b9f90973469006 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_139_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b23fa264b9422fd6f7c49c752f2e570aacdc10211dcd29e8ebc442c720916613 +size 51395373 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6e279877538860f949310025125541bd7724cfa4 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:315424a5df9b46d98adeaf586953f318670531b50401cb06701776c880034317 +size 51395426 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_140_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_140_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ac1cbc2c30e11a56e31c6625f2ab6f34c335184f --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_140_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3372fd020602f2d764b95d06025ccbcfb2d8b4f2c8ebbeda6be7c980bd7b44a8 +size 51395501 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_141_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_141_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..930a698ac2dae2f7101fcc2dbe7c550f831ea39e --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_141_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d8e1c4dd7c43c7df07db745910d3ecd7e5c146cd95eab34e0492c029f781fd9 +size 51395437 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_142_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_142_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa317f4811462e8862235da5ecd3e0010a5d9660 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_142_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15fac648eb9ba41ecc6b3a7a661dcf6bd13ee7fb6116b728119745684b2c9a4a +size 51395501 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_143_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_143_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b062f1f4c2d902b5fa1e629c3cc15031581bd8fb --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_143_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98571bdffbba5af3bc4e4d9f8a6ff1e05876f0af5217f664d8e7e32ada9c9413 +size 51395437 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_144_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_144_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1785b859b2aaf1f591b78b46883180fc13a6097c --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_144_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfc61c86c7452e6a0df68d7e3dc76bd74d68a660a2539f36f26e2a6537f766f4 +size 51395373 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_145_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_145_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a79696ef75c844b5619062ee0694dfbe8f1c038 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_145_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:784df7d399154780c62d7ff99642febbc4c6b536cc538ba276cffe8441343d52 +size 51395437 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_146_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_146_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..74de43dfab45db9821e7e5eadb858dc78591826c --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_146_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:deb5fffc3f9b6312dad7558c4743963070834c0e297a43ae3711ac6434014b80 +size 51395437 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_147_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_147_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3ffc933344d6bee5b6a5194f05bcc8c04822b9a --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_147_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc6832c64aeb6b4edd0596ed0f70da97b74e17e5f855fb40f5ce501d541680b5 +size 51395565 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_148_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_148_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..17a19f27ed273497261257008a74cd1ec12bd8f7 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_148_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:713b9dc846f57770d4add1d71adfbc344f2ab86206fc39b92b188f62e18fef98 +size 51395501 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_149_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_149_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..96356ba8056a19b007a9e5630af2ae98968b9684 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_149_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9e55463a24c2831ddff339a928226f052f549b4a9757ce128619384b67af2ca +size 51395373 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..da7a373b6fcbfd094089475e39bb2776de6d1848 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e24fbc5aa2f881eb9f00a1351358d18a53045adaa00b30050b1af20eed526747 +size 51395426 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_150_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_150_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b3101d349c37792cc1e16a7501ce7f855d674976 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_150_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56842f394d832acb5612f68139302328ffd81063bd234423b5d556032c8cc7bd +size 51395437 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_151_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_151_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d289545eac16fd79b63699d0b48e3854e1b0619 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_151_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9c814f5c49e944247e79321f7c16fa06f25e15618b70906083356d440f0b9a3 +size 51395437 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_152_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_152_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..38c9e39b7121dbf1f9829cd064c6009a10fddae3 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_152_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc5e662571d6eebe014d126df065db250923755bdb8cc1f96244c84116504a08 +size 51395437 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_153_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_153_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..904a01876c37154d2d3b962a2dbd758131f1446d --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_153_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b412ac1909b1e2045e8763974d3cb508cee042177a1c20e1a308453e8caf8e7 +size 51395437 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_154_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_154_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..87b264f1779401fff557411e2aae63b8cacfed00 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_154_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69361fc9687a08c118701b5549741db51b414d6dabef8d0af760bf6a2359c45c +size 51395373 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_155_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_155_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e1007f089f97928da8599d78371a25c255e084a --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_155_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a08833ccba3128fec5364885fc6dbd91e632992682df4b4cfce3445ff7d6fcfb +size 51395373 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_156_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_156_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..503f25e788f39df638d7575e2de32cf21234858c --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_156_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d591de2b741c2f69fc5b12203d28249594a6017f78aff484cec22edbdf056ae +size 51395373 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_157_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_157_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e976b298218eaaa980badcc76697ce90dd29a100 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_157_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d36d82701d499a06000207d67ab8819262e086717604478980b0133c6b0507b +size 51395373 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_158_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_158_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..526b59b060832e4849dba72fcd953b98eafa90b8 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_158_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74068091939e7a459dc92bfdf00aecd74b56cd55917c70647f148e021b5c387d +size 51395437 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_159_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_159_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b08d1c346279ca63b083c935be9a36909c5586a9 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_159_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f354c7ffffcf3afd9c9eefc935d9462f431a8cce44c06a3b671bf8f6776f5cf +size 51395437 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa30cd7739ce6b2f89cd7cce2e7a8e2dbb335740 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b5b43e0eca4a81d8b8def05204c32a532eabfeb8ad0b24d3c2e5f54dc007395 +size 51395490 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_160_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_160_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b8b195cfeab1023fb9d1cba7b1ee80cc4cab8336 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_160_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81130984445c27d3ccf133d4614ff6934263ee7f895e5a6b1c8314b1dcef34a3 +size 51395437 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_161_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_161_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f11cc426ad7058f6c362440c9164885f83da8b9 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_161_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c4ffae403818cfdbfc9d5d66e0a144e415301fb6806e18f71ddd6b253bc9f06 +size 51395501 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_162_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_162_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..66a2c3761d4a5c916d7f0762e16fc5697d09cc85 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_162_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03686371f5a1254502c2cb037b4fd2e8b8a275b2463cf2c674e2d868be640f28 +size 51395437 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_163_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_163_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f6ff6bc42ab1fef38afda8cf4099e7e19318d662 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_163_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2954f029d4ceb6caf2832b44fa2948394caf1a16f2de1e355ab0aeb78ed7562c +size 51395373 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_164_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_164_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..13cf1fb733f2aff1e7fa05db0a91a2ae1c849867 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_164_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bbe2a4907358e17d3cc3b0675c81ed71a7e5094a26696fffe10dc8a7b4888d8c +size 51395501 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_165_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_165_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..401071ab8992a8652dcd9d78ed3d05ae1f57f03b --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_165_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2536c9e259e53c6fa26c2379de86257e79e018300e6d40a378c1b330e5ff73ab +size 51395437 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_166_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_166_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..345ab4059cf319566965b5db08705b933e833e95 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_166_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b5f5cb245df263a091fd36b0ac7fb108e36a6a784ea5a5dcfba75f359458be8 +size 51395437 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_167_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_167_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9db545a7ce2838a8663aa6a42965e6ceec0581b2 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_167_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee9bc4cdfdcc9d5b6b1b27284053cb9d644a179a7783762e9f3cb90e80556686 +size 51395437 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_168_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_168_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e15f8c22805bb6d15c5daff07042b82443c32cf --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_168_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf71d5bded90ff873679111d65f344697410e414d8a60b63996189a933504e8e +size 51395373 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_169_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_169_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba41ff9f9525363e5ef24a2f7613ea1c3af92181 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_169_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:364e3153f366314b4dc157df6f12ca73f0fdbc7f2fe433a1187841f7165bf747 +size 51395373 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a007ab7e12416fa82be290143bcd09a837cac46 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ef54e9611078c9ba6b36f67071b6bb90eb5441682c61ef47fd6cbc317152b05 +size 51395362 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_170_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_170_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5bdb7020bf10d8d6a53507bbcee4c71c5923891d --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_170_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2326521dbb97b2adc3a2d874a0287698ea2f6e9bc6b8556e0667bdff375e4420 +size 51395501 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_171_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_171_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dcc9e02155154d46ca96fdd001bd2b2ef5bab89e --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_171_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6448d9327da2765a4c8caa8c5c580f82659bb7d91f27a2589f51386677e20c1 +size 51395501 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_172_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_172_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..34be7f352e0d39e37e63e5cd5d1561155a68e0e9 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_172_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebf780aa743a73a260d6cb7c4ac20344ea4ccdd68fb65f7fb26a0a7b66a223e1 +size 51395437 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_173_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_173_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee2528dfe70136b5bd0a95a65619b66b8dd9fa36 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_173_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:737c1cb1dbd59cf8cd95027b29b8a12dc575bfa86fae85d451a46c9174d531d1 +size 51395373 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_174_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_174_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..37102955d4ef214bde382b69b5e58576508db23a --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_174_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:423cf0e2b543871d90db1ae5a64975bb0c4a0121a552035ea5cc8e116a4799cf +size 51395373 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_175_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_175_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f76faf0d43ec79999e86c05ef6395f5bd7a5c824 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_175_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e02e92bd82de63651fdac4c1c5d6b8e45a1aa8be59327395c5f4412ca8dac6d6 +size 51395373 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_176_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_176_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d8bc851bb7258b245600b056cc74dc860a10c9fd --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_176_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06da98c5b1611a38c98d6c074756b1f272e5c02b76167465c886023a901e45da +size 51395501 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_177_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_177_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a6643e3a170117676cf9c8470b5286a9321a6b99 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_177_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4571c8d67185e783880ae6cf12f2e53d9851ec6ff919de9e1d35aaf70c04434a +size 51395437 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_178_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_178_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ac89626b7baeaaf8b352c2ce73df4c4249bc2bfb --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_178_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e94b7be61d234a2047332c928eddd5070269fb90c4d828b2cc5f887c0e8cfbb7 +size 51395373 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_179_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_179_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..da5fb9094b5caf5b29affe5b24ba1ad01666ef95 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_179_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70363b23a37c10048438102348fdc4701c77c007ddb2b63843da26400c588deb +size 51395501 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ac3160d3116aa66006b9f57595f4b70992f8d3c0 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4971cdcd4b39ae29a431629073e557b7cb969f95d00c2a6b69fa761269d565ce +size 51395362 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_180_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_180_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..64fe6bab6d69aa5d98828418ac3f2768f624a1b3 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_180_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8006d595ec01a0dcdeffa49a3b9e45ca3f3e086a266c5190cfe820819a605d9e +size 51395437 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_181_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_181_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..534cbf9e077303e08a5eba070a1a041543f60d25 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_181_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7e4bc3c0bbd250b94490dbfb5e1302406476032577e8c53a590c72471b21e61 +size 51395501 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_182_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_182_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..09038415dec50d765b4ff22aadcf1a256650cfa9 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_182_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef161fbc670452d0c12179ae734bb67efcc8fd4b0c8dbb5b9fe6c81e440876d0 +size 51395501 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_183_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_183_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa335d9f46a82e8e0cac6c3aff2a294851187923 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_183_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c548c1744d8c978b5e6c30a3a82001691465dd142128f39910d4365fc67dfa5 +size 51395373 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_184_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_184_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..05b7aa1d402050351e0e38e44bbba9f32e402b49 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_184_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28308d9b9f46c92cc6e25d58da5e2e360738c2b32c826ed623f7ce2009a72cae +size 51395373 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_185_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_185_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a3bbae2318db102d30cff3b4e7c578dcf1a6ae08 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_185_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:661e36f72437f38e61a1e130cfd22421d11a20cbb36ca638ffd209b9912b22ba +size 51395501 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_186_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_186_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..57e5f7f2bbfaacf9388c05c1762ad2d4dffa4d6a --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_186_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1daf6f6c75e0d33b1ccf52f239d8cba71428ef265dfba83ca23b2b9830f3ea3 +size 51395373 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_187_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_187_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa0b014e95c9120115d848763066fc3fdc71aee2 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_187_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ba9f6c9f7abebb2f454b33d629d2f047fa83d3722917dc3ca02ee9509d16925 +size 51395437 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_188_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_188_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b453aef0f7deea7504685ff5552203826f86af8f --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_188_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02725cdc832b2227e120d66060932d090274fd49839fd040b884505eb63e2b40 +size 51395437 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_189_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_189_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9cdc44ed9e246db05d6459c88fb1e37c38a90ba7 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_189_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca233d3def71cb7f59e300b21d04b3bbe2f3c0877031bfe21ea0899446c41f97 +size 51395437 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f50f6ba5147f49bda14cad191ce61533002a47d2 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dca9cf13a0b5046f38ad5eacddb96fe4242198c67496341225e86d0042672119 +size 51395426 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_190_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_190_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9d7a5f8287c9c7e41fb59630c4cb34197c9745c9 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_190_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae082f4de80d80e6e92ce461938cbc7de12fcb038f102f322910d8cd92ef61b1 +size 51395437 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_191_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_191_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6536773e228123e4c74fd9e43c12e56a1428ce9c --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_191_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6abb7b78d79ffb9ada1fe049d13d40df5e94b4eca1515688f20d1ba8e24b538 +size 51395437 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_192_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_192_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a91a1430feba3adb20fa70b1506226178ec88b91 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_192_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d0f77d2630098ac97402d9bdd75834d642821f4d2d8d333903b712f465e0e35 +size 51395373 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_193_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_193_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bb96070a2c7d03d63ebf538d66de20e23423459b --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_193_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3197303fec6a26948adb9ac7a6748a69cd34380307e36aeb5e71b1d0fd0a515f +size 51395437 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_194_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_194_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..116fde9a666cef1122b044979a7fb96c6a28c50b --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_194_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04e1b7ba2545711af7c828386248c2b34f0fba384b0baa097e8d73a7ca2a01f4 +size 51395373 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_195_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_195_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef0a9a8ff20af97ac20fa460e8c23481c8d84fd2 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_195_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39d7e7f0a4108572c2a4edd8af8610dcb2eb9bc23b9f35a0b0822b4aac73fa81 +size 51395437 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_196_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_196_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e6fc3ce3eb86e6ddcfd776956ae1b3fe77defcc5 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_196_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa119e5379db56ede7335a3a144f6d8e4ab68ae1cd47869d8a626dfdc84fd7cd +size 51395437 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_197_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_197_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a8d690dcfd33199767aeb9a4fad57137d6a679c --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_197_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d489347726cffd9c4fdc1c9a7172a80790517f259d820a128ebcc954ccfb0497 +size 51395437 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_198_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_198_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a128480b406b9c7bb6b1e63c907c1a165ae2ab11 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_198_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4815aad5782fdc2462573154728aaabd0bca1830f5e80363d378f4884568d46a +size 51395501 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_199_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_199_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9184470db7d91b65ccf66a6b5017f85e305efd3e --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_199_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db2b9c0737892835f111ee4e7fb04e25c88c506153c7bbd2a7d6b74488415289 +size 51395501 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ccf7102cd8e756506c445cd9b4c4f502ce036e90 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0256835992318beb81937b4b317122e286a87954e2bc56588e0a165d62363c4c +size 51395490 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f5a96e64e71cdec8a82eb3325c533f5591472b06 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8cd28289f1380ede7af9f2f984cb3992012e7e2ffbcaac4e63b36f5dab642a1 +size 51395415 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_200_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_200_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..24775828767220edff1f6de335264a3604783855 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_200_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c97469e02e670c3935722011e19378a1284d8aef57d1a74c933cca49d4ca0f9 +size 51395437 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_201_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_201_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..89242986f5a58ea6b113b2d7d84ec6aa898ba74c --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_201_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:669d8db05a3d83b59efbb35bbb186a0cf87c7f73046df62d77257005957805a9 +size 51395501 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_202_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_202_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc7d449613eb32fc1871c595b95c2ef674945567 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_202_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:efe7d55163e1673167c1386f7da0f0fcc978b4a769d5398736940ccef770c5fe +size 51395373 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_203_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_203_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1867dbe8b5b774945d06f280bd98830fadfae043 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_203_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d89eb79eebb5b07485837fcb9ce2b00009893f7f9e7fe314a5edfdc117f1e62 +size 51395437 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_204_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_204_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..785bd5e3f810693dc6472e3a01eb64b76e268407 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_204_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b242c2479d432ab6816637e8797c88b73643c33f1b7b20372b8b77d94a12d53 +size 51395437 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_205_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_205_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3d9728650312db1fa524b5cfdbd7c23c47935658 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_205_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b58ad1a4d0b6769955f3d88333d7c59ced94417269e75927ffa6e43ea2d77b4 +size 51395437 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_206_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_206_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..887d251fa81a27df35f2499911230b4a7b3df2a7 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_206_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d44add209fe1e15f0acdbd191dfbf97a11097441e1fdb7124cf8ce02a9f46f2e +size 51395373 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_207_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_207_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a264c90f9902e28546938c4e840107719a4b4752 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_207_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3bfb1987a1ee0c1ba82235d322ac182e20017ac62772f95703755196edf30749 +size 51395437 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_208_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_208_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..de802eac7b17c5199d37de2baeddfbd2675f3ef3 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_208_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17a09576e5f33ab38cde19748b338a2cdce9fe9a546af556e2628d371c51e961 +size 51395373 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_209_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_209_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0af62f44566312b47c9423141f26d21f71d4fdff --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_209_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67df12c39b6347f27d2ab0297b63f428142b440bc0ae7f74f397dfe1e748b639 +size 51395437 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..24b1d83abb37b4597acf91cb38aef60a04097304 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff47bad8c40a4fabb99e87cb37e94947abbe89f9045687b5fa72e30304f71e59 +size 51395426 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_210_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_210_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4168be989eeb31c14af8e8bdfeeb139d10c45de5 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_210_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94fb35d57b0dbbbc7e8abcbcd42902183b902b8be3841b12939b02859ec25ac8 +size 51395565 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_211_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_211_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7cacfd22d5bb5008443bb3d26a5f02c97a3a523b --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_211_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3cdf7c1e9c32b0adb9754cc2b068ae2cba07ab05aa30e76df3e3241152775ace +size 51395501 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_212_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_212_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b60fcc4bd1366030f0b8a27ffb30a9042411ca1 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_212_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e35c7c6c9dbb091bc5f48bcfe3b8ff4c97729a2d3abb5b10de0a3bd09228151 +size 51395373 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_213_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_213_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f73e7a08a6b7b60de6f28ad3ee24dc11e4609d62 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_213_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d0551b24d3a3a5650fd93251faff1f216ad15586658dde4188a7d7d83bd978d +size 51395373 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_214_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_214_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2812835f007f0dd55c346b43b792d7d91502e998 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_214_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:072277b16746a88ee9069e32178228304f4d49520305f1584353a28ea88067f6 +size 51395437 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_215_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_215_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7d0f8953ec27ade0807251232154c1e86b9c76a --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_215_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3457f1eb8b84eed2b433efdc8281c3887ec808685ae5001b3fe2bac375c160c9 +size 51395501 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_216_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_216_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e4734cf0745a45a5612b8d4598465e24bb93bc4 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_216_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f63909e089dca0a61e11b843b7d6fd47e63f910e655b23b17ffb40533c01acf7 +size 51395501 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_217_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_217_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b8945c60d87fe4c33737fb8f94f1eec4619c30a5 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_217_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:231edb15be6ee25219b6a7d17c2d9124ddf17c234ae3968b8e1d06772b09787c +size 51395437 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_218_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_218_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b68e5b55c7b51be2f4e5b0207b37cfb866806c37 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_218_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dff09d6e7014d3f762e002015c4ed54c0ab4edc175aedc4fcf12b62e35c1cf1c +size 51395373 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_219_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_219_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..879276dc8a059e3486a7a060ac700de8f212aa0a --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_219_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ff03096cba6a86f1ea0e48f7afcca4088768cb77edbaacce7ddb51cd6042fc7 +size 51395501 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f1f16469f247dcd4ec2fd4ad6738d216a287fa23 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a408a96d128c0aae5d972f1a7563a9048eaa0006ea77e53e1e09bf80696dda23 +size 51395426 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_220_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_220_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c21be4af140a3641586fdb77ac89ef7da863342 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_220_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77b52b7af54c9c978b3adef76e95a84ed995a7c3f48a1b936170847bc97d679f +size 51395437 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_221_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_221_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e2e0d687080d41a1158280ba6830e6dc52e83b22 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_221_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccc509cf91135cf7cd5f45dc9927daaa5be926160e86cf0de31a985888b4d143 +size 51395437 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_222_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_222_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..57b058626406af85d1f2f3b88a0702e3fc421bd8 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_222_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad3e870d17b1491f5efcbe9393e11cbe253f712922e3d3e10d17a66fda29bb21 +size 51395501 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_223_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_223_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e0bf47dff186d1f4620a9f303c56ffe348d5c621 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_223_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df9486d778d9876b91799d737fd53d07418504e5ea0ddeae558b274ef8fe38b9 +size 51395373 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_224_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_224_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9905065964cb96480f123884fa20aa55c01e6d66 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_224_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34a73cac37988fa0168b2f188740b49f44ddfd0f2fad5b2f923a0685618fea90 +size 51395373 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_225_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_225_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..62e44e7fe752df72517641431020bfe2a4c737c1 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_225_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9eadd2165f62ab45adf39499d6c3240966d82021773366952331bd4e4884939d +size 51395437 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_226_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_226_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7fcdac57d9f9ea9a1546576c5ec9ba95a7319b19 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_226_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d11cd51cc777e33b357248463b287c11413f334e7c8bcb23fd2cde03832f4027 +size 51395437 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_227_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_227_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..03672cf737169f1e9ff93e7fffcf04edef21c9c9 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_227_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:463033e6733dd24be8ada04414ff7fa3603344ea342e7aaf4c70b2cb768ef642 +size 51395437 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_228_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_228_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5402455562966295415d82603360dc0196722fda --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_228_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ff2bf90a932bcb12466fba5f5e2c38858e63ce11262f87fbc66c65879b12542 +size 51395437 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_229_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_229_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f7048776f106389b81219e4c33c0fcf3c3f09d92 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_229_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99de264e2c1bc05fc097156190c04b773b213a12078285b6baccf47903ca5ad7 +size 51395437 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f2f92bb60fdb16ae3f02f52d27a7394b86a5afc8 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aba3b68c8f35586944b8ccaa42e1196c59b18d9102a723fc4ef2c65e4e19e10f +size 51395362 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_230_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_230_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c7fa530adfc89697647a9e7702d232c5a086791 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_230_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:642b84e3b66bde991300772741ef4c22dc81f38b11054292bab520dded5bc17f +size 51395501 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_231_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_231_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..98293f02011ae3092388c2c6910e9dc124e4284c --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_231_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4bfd8f87cadbe4d3a2fa7da7cbdfa215838d95a0bad68d99b5f647b3e0ee14d +size 51395501 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_232_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_232_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ec55eeb414a5a5c25c8ae21b007fc8e586db8b3 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_232_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cccb539fb19ecedafac252f4c60ad0e37e0b4bc7d5a76707b31d2549160a52c1 +size 51395373 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_233_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_233_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d5cce29923b72985bf30eda5ecfbb8990397e15e --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_233_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:493104f7475891b359352e84e6a1955afc0d2022e332d85d213cbcd7f8c9f16c +size 51395437 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_234_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_234_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c01eeb85d8a8514fb35e17ca7e05791585da62c4 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_234_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfc6182dedd374515db1041cae6fae01fca08dda5ac883dd8a83445e7d0a24ce +size 51395437 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_235_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_235_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c4cc1968ab0af1b91f578c292e9157c7efaf58ff --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_235_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99d0612abb3127e5cf026073fff28ebd4bdbed2ebf9d5e5a8bf0510960a28ca0 +size 51395373 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_236_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_236_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..09d902af8dd432fffe434ec3c3660cd0fa7ce47f --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_236_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab3d47f9d6c460dace51207f199b5939c8f54b92849f42551f11fa9b420f677d +size 51395501 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_237_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_237_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ff72e5cb03eb24dcaaed4fe36ea3120d7d1cb89 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_237_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:056a9819d301bb4f21b03812164075921452491b2bb118b721ddd0251b7372be +size 51395373 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_238_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_238_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f26daf5ef91e4d761f2bf426f3f5a5e98762b7d5 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_238_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7187dded5f1ab9258f96f41509e38164848e70892510b6631ec3ea90a327e1eb +size 51395437 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_239_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_239_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6115b4b099e1cdf4cb0a00a12e5d4d638b23b90b --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_239_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13ead07eeb7725b52349fc7ef03f18820f0e09c0cc841ccaeb7cdac6434244d7 +size 51395501 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..03696b66fe6668736145ef751d7e0a6d877d84cc --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ddf8bc4e16bc31b529dc3ad705f3a17a8201b560a8bc84f3dc37be403e1d575 +size 51395426 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_240_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_240_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a9b48e75d300ddb0bc055930d168889357dfc42 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_240_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45d942e3669a9015ca9d847cd9a3d898008f902961ccdbbb02fe13f26e1fc1a4 +size 51395501 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_241_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_241_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b7c9043abd06d5f75116737699354693edbacd01 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_241_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b4ba4e3c0c8f8d3b133d705557a795b093f5d378579a986ae04c104512d815b +size 51395437 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_242_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_242_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..52205cc3c6270589cc832b48ef092d264c489319 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_242_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea51bf6e8a94fa9706324d2339eddcb1bd23d94ec1069c242290970d5fa67868 +size 51395373 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_243_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_243_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fef075aabbccb858f26bcab07be75970b6118436 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_243_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ad3cbb3907bdb134197dd790670e769d799d5ce605f1f0692d45bce6a9f6e03 +size 51395437 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_244_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_244_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a01e3ea469c5fd0e6140c4c7ea15d508fe388ec6 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_244_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:79c939fc343445113f048ffafd097d309302c2cc14a9332d5439c8db54b196b5 +size 51395501 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_245_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_245_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6eb55ea92d90acff862575c88c3da6334baaccb3 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_245_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b178c52982e74053ba2481b2c9ec06d7f83580db7d75aaeadd46dc3bae42fa5 +size 51395437 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_246_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_246_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ea779320dc001a3053a047a4cea5ea339204d12 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_246_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4041a744eb40ecd3a16891ef75dc3cb271d49d0b3a8f6d738213f241e9e39308 +size 51395437 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_247_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_247_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ecad5013ffa4ab038cc2d7ea12f9c62d63debd7 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_247_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7814ca661a1c3e45bbb9ed759eaf0dd7404a2f1796d1c9d4a0a73b2cebe5761f +size 51395373 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_248_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_248_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f43a36b9667840757e7b0a5a1bcbde193bfb78a6 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_248_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07a75a33ab6344a3dbde8848151d0258e4c77922168f4213c9d8d4c5ad2ed5e2 +size 51395501 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_249_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_249_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a5df4d7166e6ed5e814ffeac420d09a271962982 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_249_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07cf66495bd2fb11e90ca1880cd9154ba178ba3c1528035b2456492e898ff913 +size 51395565 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..53594b15d4261f85ed93f97a6844a1d2ef47c372 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb71be1bbf6437824b5341148ef750bd0280fa79a7100fa68985f04510974f48 +size 51395490 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_250_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_250_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f929218f625abf5392029b8851c7c579f0b4d7d2 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_250_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee0fcc5aeb6a5e86ec31314c3c3f2d333173b0cb8a8a28b2f54555fe041644cb +size 51395501 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_251_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_251_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba8190ea6d4dc05edc078d465282f84a22ae0e9d --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_251_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec1d3ea3f68bc67d4a6107095f9c5e1ed612e2a15e4ad8283880c4600752bd40 +size 51395373 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_252_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_252_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c34e6ff414034312bbbdf0af3115837649f6e541 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_252_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c5684a738e2c0e497cb42f67b6e12f40d80c5aacdfba0157b8fbf998a2d930f +size 51395373 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_253_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_253_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..84fc0463de0ecb3fad2bf143d28dfc6538be249f --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_253_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f04b68166e81968ce032aa81b741eb73a70ed3f5f8281295a2dcd0747ae6ad24 +size 51395373 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_254_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_254_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f2b7ccfdb0d17ce8c061026d4576772b30c1e96d --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_254_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ecf05640a4e774a75081f310a16912353591f0996685fe3b92c1009a2369ba6f +size 51395373 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_255_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_255_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bfc48ac87e45f5eee7769a8322e9b16526241064 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_255_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5947b1a216c789f6fed3c85d7b2621419c9efc9f2e4fe6b5b7251e66647d512 +size 51395373 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f600f9e5e3452d105a20c938276890843c30d564 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b92b3adf3632392413d9adc77971e51c59ec397d1d83193705c8f7b0cd21f54a +size 51395490 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..968de5c82c93a7ef32db3ecd53b3afd2c0b8e882 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47ea6616b94c7b14835bc750da66bc8fd5aa8b9217b0794edc8bb2aea524b642 +size 51395362 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f69ab58c2b526ba463f057a76969d64304673686 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea443f764e9587cf16e0f18b4523ed946ee20980e31283ef3e533ecc23f478cd +size 51395362 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2735db03428f895d41f668e14d15bb66fecfaa14 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d6f06abf1f66efb4af9041195a57953a1af8a1e7541a1a3b2b11ff9de67725d +size 51395426 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9af1b04474499385eae850e9a083d96da4ca397e --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:173a395eb2125d27de48abd3b3e9097a0d64b618ca8a6a60a13e1989a46b6646 +size 51395426 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6cfb4a6e0b705197df3380dc8bbb33e3cfdb7c93 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be1245bfd02089084adfe47ee7865c1b169154d4b1912e49f5c6dcb720307bc3 +size 51395351 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bc7cf9c41e56082553755bcb35027cdf60ee3f23 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62ed63245c4a6fbece3dad724624855495cc269387ceb122e29d604c546c0c9b +size 51395554 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..61ce02f6963b9f84bfebe30bb0de71105de469d6 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f64031b75ba354d164502ce37e920b3927a496659a27b426d6f79f4b7ea425b8 +size 51395362 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e0c9747384fdd0845de02832eba519c2197eadf6 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77dceec99a46214f980e7eb3b13cc2d27d1f123a6618339b2dcd1716899ecb09 +size 51395362 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..66888cec28176fd0d87b8a933ab0d58391f62edc --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d0ffcc857e9e8ebab2ba7197bbde5c5ba3ed5de555ddecb697718c4c3da64f6 +size 51395490 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd2e726378056eab164d4344dfbe7a5e601acae8 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab9c3a9b280b959212b063b1e1fbcb021bec3d0d6e7561f6ee15ab02fb4c3ab5 +size 51395426 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7359818892ae76735e2ba56f0a0a1d445021ebe2 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5f355f9f33bd1bc58ba668dcd97ed04a736eb50b070957ce3954001e3226dec +size 51395426 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bb824619335b91dac1c34de84c954f289f515740 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80d41a1fd7faa73d4acc9fbae88a6e1d0ef9d329ba012720b4b3a88bfbfec042 +size 51395362 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e2ea920cede53a6774531db6e558866209c8c3de --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8edc34b465464d21043d8111e3b3df91ce6db00f8bc0ef6a5b4f67afe839f759 +size 51395362 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..25a3c4a90b527844ed8a3ba1f5f424b6486adc6d --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c5dc4ebb1d4eb72356a90ca8dfd6780f31c265f1256b1252e870a22a7cd33e6 +size 51395490 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0e6f2c87e164a8ce6dcb35d43f7d91b10f8b4f58 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b1d9341731c60fc317437a07e4ffccade3fb0a2833b6739d2a983ae8b8da2e6 +size 51395554 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..34f448b1d5932bb33b10deedcf3f70b75e459e8b --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90dccc136e32d5bb57887e74410a7d4fd0263ca3b8aaf6f9157b64005fc11f29 +size 51395415 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eba46416a8b2419202178fc990fa4cd287ac7a47 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bae03474523d9f27d9ab28146c5fa135fdd6f22b5a311dd9a4e6d81d795cb058 +size 51395426 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2b369d5dfb98005b6ba4388bbe2f2ce860f58039 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e72e38a23d1517c8fc2f8d54db682e7d5cb1a079a067c4a210c4d553e3f79ea1 +size 51395426 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c6abee3ed1630c144d588a76c201061162f5671 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17ebe50450b6c9f291cb95d805a5db4b4dec662954533a794d0a56818f014d8a +size 51395426 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b3ecbdc3c64d930816eca90b8c4f406984e40082 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a37904733fd204f813a2875aa7fce120200fa9d064cedf30f152647cd85561e +size 51395426 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..051c1e7b09dd21587d9bbd2c0f888a9fb26a1d90 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1a40143a38e09904ce07dd62bedcfa5b3bb200c04656fc432722263f5d48336 +size 51395490 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0889b2b41204d517d6bfc838ee16810132f15960 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:421068ab459d71714b50aac80cb1cbfddea5b8011bf07f8cf9093252a3df2f26 +size 51395490 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f87e5367d94a37858d97b4a72d4ccbc3854f5ef --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae8ebb2fba357b03db74d9d639abdde0999815b02219566265e7d20cb4544e9f +size 51395426 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..29ee626f640304725a208a3a7a25f5b7616dc853 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb962f3a7e82dfd3dd86026d3bf0894c48b84deb9d8f9b05d34089c0edc4536c +size 51395362 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8d3e961064e3d02025c09cba111b54572db87d1f --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c670c7f2b069006dfdfcfbbddca1b829927eba84c3719ca24bfee74698bb349f +size 51395426 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f5cecbb5466854bbad4ef61864156e1079fe710e --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89abbe1a3ab83812f753dc29778be332128975147f886c7803a5893e70f0a18b +size 51395490 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c95e423d5380d0ffacac67819a0b8ef981f7e858 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6ad2d8c9196f349761c2faae4cb13dd7fd9e4bd7f01993b377f13fcdd87f460 +size 51395415 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..26fc9a95f960710d16a68b5e1142b5a57cc95415 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a631fd04728dd7e9f7284194a0edaa87a1094813266f386e0db8564aa33071e5 +size 51395426 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d6b9b1128a693d2d17d86a2fcfe03125997e7a8c --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ddd00510b029ba6ee8701839a85aa15d873c04540f9e64d8bd7caf4cc47ff64a +size 51395426 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6782e51b799ca4cf90ecdf747ca1cfc7e32a1f1a --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e30d3cc1cb82f11275d73eee07457437bf050a23d19876b5367949e75cd914d5 +size 51395490 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..898e3561f4ff52581d6171245e62bf591f756790 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c3db4e0368064703d961b8bf2822dcbca326238e9c3469ceaf5932a92e5ccc5 +size 51395426 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dcc400a8fe0a52dd362b5c2c98cb614b06be1286 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08357aee38c466381fefd669ee07238681aa15416c179123a7d8a3c3fbdf1ca1 +size 51395426 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..93c778c6e9515aab8ce929a8f485edd84905b849 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e95a12af4ff8c69ad2339638e92611d92f16f921c79b0fb2246137d19091d94 +size 51395362 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ead8d873791cae088f5bbf77e78fc212e94f0710 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be75c01fbc1e21de50981ebc6178b660b748b34ec3100a3fe4d038ed45f1ef6c +size 51395362 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d108bee621943127d36ce0de305898afe60aeec --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2edbefed950087f6842d7eeada43b936ad10e3f30db65cdcddc93dee71dbb8cd +size 51395426 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb680d3512cb384e286eac1c64e34ee06f120200 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:683635279a476694417f4e565d4940f58cc96a4434d35d9563629c5879d111ae +size 51395490 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed042e8efa70ca24e5982e8ad42001cd98da48aa --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ec7c47bb9cd7b21fecae5f27ddddc912aa62bb7d3ee89b7ade36180547c1ae0 +size 51395426 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f452e8a98fb693c2dfd3108eccfe0770190cd452 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4bbed771a2b5c5e14c165f817f0742aa46bdbb6ebdfa93fdf4b72fea1b9ed6fd +size 51395415 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d87bb3b0f64d0308c34291103baf072dd42074e9 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d287348f5ba3bf3d177ecd109db5be94e6aed75a376af6e841e782756db8ea95 +size 51395426 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d59ebadb851d6fb100114239b39449e0b12d8eff --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2428bfdad991190cf79ed85b8a1569f1beefc60805dc4ac49bef5aa166865785 +size 51395362 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..54ecc4ef478a4c06e1749d347fa73096a2aec1f9 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab602c4be5d700bec011f839caa9c60f740509005d02e5c916899cfdc13380a4 +size 51395490 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa9b0b7567d8979aa4b6e990db14c6f5a58b7226 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6c0be3c1fa6672626f2d545ae734bd4669f714e74bb59110b6a79a405201058 +size 51395490 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..494e45c823977dd9dad2c642d7c1c20b1e691407 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80fc4c570feb3a18511eebf950c2776823e72ca3e6f37b6795ddc14bef99c7c5 +size 51395426 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a22029d428a1a0e037c68b6f3cdee1b4372101f9 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f7e186eff525b34e29e9fecff992206104ad215908ba5c39456e8acf1563a4f +size 51395362 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7366f705aea875d9830f1a9eeb11a7ae61f757ff --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49d6e2b4e12d6ea36333b9d4b6838757a764f672a2455c8970000e832cbd8c54 +size 51395362 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a622a81d6dbe971bda785c927185dce3397551d8 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb6740f33862d7683b41a1ec9154c493981926bfbc0204261e1164cf0c1c64a4 +size 51395426 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e977ade19943fe2d75e7d43909e8cbda44952e09 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:439211bea248d74bdd31b90c5068be1448b076fd0961f26d0125185f0829296d +size 51395490 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..34a0d5a4082b3cd39585dfbfbcc63a728bb2e4ef --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5728ba9e9f8ae7e6eb1e546c076080c5ec37cebdc328d41ec7340dcb6014c4c4 +size 51395426 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8173f78d256e94ab274671a105c6a3604d154c13 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc9600b810b8aef7d3355d33dd16a2dac9213f0b90022ef0d75ef175b62498af +size 51395479 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f80df2de94b0266e38b8c484acf811cd539b36e5 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60044c2262444c268c6bac9efbb503cf9be8fa0d66213df1a63cca37a274f6ac +size 51395490 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..71e3af4beab88bb1e5eaaaea901007450f149970 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c426edafc53ad097746ec4386cfa1f4fcd74f6ba2cbc2da4224fa74e3e391c58 +size 51395362 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4dda962a0ef6e128d5e2bf414fb75fc2bac8dd7b --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95db1faa66005b809468dc2e0286609132871ee9cc2e210667bab9026c670c9e +size 51395426 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f5f941404a9285dd1aa9105109574d0e409a9e5f --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:281329a4c1305cd3b5a77e9c598ee3910d8241252633c5797eb5cc3f14098dee +size 51395490 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c7a635a77b1cb2cfcae3c09e6ad1e0e5294a7573 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a62fb69b709ff9c3563ed166c44b82c9d6f48667718bb159fcadfd4df2f0af8e +size 51395426 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab59106ac5d38c61b1c34d10c74e559eda47138e --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98209691c03d65f62b883509bf320dbad9f2a3ff229d67716f0facc9b26c7221 +size 51395426 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..14546e26021fa27f5e5649ffc7065355d6d5e40a --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b845a22ed68b4a2d931e0d8e5b0419e7c379d003d86758a370225c344137c4a0 +size 51395426 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f67746bc13e363f23dd947ed7f6004b2679b7288 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02c1b3e3df406b1718b1a48b220a97d290cb249e157e42192632ed57cc2743fa +size 51395426 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9aeb1a7ba6c806b0f74a75978d81d79a384f13af --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85c742af5e349018179cbc7f59f7b1cae885515d64d19e9366ab600deb5d34f5 +size 51395426 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..da376e989dbf5453bf79d5b46f57420adf7fbc6e --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dfb14bbae2c93eec99aa453f3a3367b5b53e9c216e925787e6fc0de2baccfa7c +size 51395554 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e77047bd55ec1172a04b1692b66c86af1ae048d0 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c5c9f98195285683c1441586cafe8a71e83adb20263313e8cb3a97b783ab873 +size 51395351 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d74e771d692a6234a7862d79ad360dcbb4a349dd --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:adc36877193c2678ec5d97b2f3e8061df98f0a1bddae0443a953dac20e93a6a7 +size 51395426 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa36505e5a0f691e58cbf9f20a06bf83a50769ec --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abc0518ee38259e1d842e6812904c6b3aa7180d08a7dbf1d61b82faf1723bfd7 +size 51395362 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..990b07c5a749d4a8cb16a27efdb568bf5a912109 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc234a3796db54db3e22a803198cdb434eea8d28d4e97253f4cc22c09d7b2bad +size 51395490 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..36a934fe28ea422cc848c2207fb4ad7fc13f39b2 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:efc9940601487ec520e2c63bf3400d8858b171400cb82f198da0b1988e28820f +size 51395490 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cbc3d6b20521b3da791c68caccf9910bf42a6859 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e715c9047c7794b4b953ff4fea490a3e63f1b5791590d29c8a82c10def41e22 +size 51395426 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0c98324f564aeffa72f3ece9ef40c431f84cf6c --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e63338210211dc0350856bf594656ac186ed22761c4cf9673ced652b93d3af16 +size 51395362 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..659e3ea424e57c7bc094ef17f766fed3d31036d2 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1f6726436d5b1705444153847b48a6d561771f5fa96fde579c4bb0005baf699 +size 51395426 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3c6ebdd076a406833a0733c5a88de9738c56bb6e --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d9741ada89a4727a51b400ab3ed3a889680ac74a59b261edd7b664dd98efb7b +size 51395426 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..41159c958a402e2e5df4a20d9f9c43dedfc90025 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0af43458366fb55b98e1b92a3877a36488e7162675c085b595c410dad4f6efb7 +size 51395426 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e47d1a2814348372dc1132e774a7047358ddcdfc --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5fdd3f0496a79dbaea4921bf45ae4f13bc9a4a679dfbb490ab9d3d5e78c67c25 +size 51395490 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4db2f1435774a413a4ea7e9970d5b5253feef07f --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50407af128fb1fa4bb0a1a553fe52cefaa01a5f4e4208ec8eded2b5bc3291072 +size 51395351 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f4dc50705ec3c8073192583129bfb688c5951cee --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d295d9728f759f30ccf8988d4bd2b8803eb04ec58459d980bdd7a4da1c93bf3b +size 51395362 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..02b6620dc3d03fecfbf917599fd58cd46a702465 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5da73fbc1c5e5500505baf1d624e8d826e09d93a1187c34b50f93f5e875cb180 +size 51395426 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..98ccd25e5179b9eec679f4388a7dca04fd3400ff --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8cd18671c68b3b88b44944e7ebecce133ab2e953e631b8ce9de3867a02049963 +size 51395490 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd0b24a0b60d36ae15877c20050509ad8ff053b1 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d261ba5b7ea5c4898e3c496421c793a5e385e2e45ae122ff2d6665a46c4ce7b +size 51395426 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0d22009e17976c893e5a2d62e2f99a56992c9b7b --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76933ed2efddbb95ba227cd131839516851e5fdf8ee9d57d529894aaa9bf8262 +size 51395426 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..525f595e41f76ca78b908a4621600c5b585139b3 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:389042ed966160059f994d76c69339de9598a732aec7ca263b86fab593de808f +size 51395362 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f1950a3508191daa752db6937695aaf3bcef26a5 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:113450cf17d30723ee6575a462f1c3ef00615be1d90283f916d31365512d1d08 +size 51395426 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ea49f4af159275935e693dcb80a9f0f30899644 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e59daac9ee91b67ae25f07ccb2981e8ce6cd06ba067ed2000f90178a42ba0bde +size 51395490 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dab78f4127a95f9cba77b524072fb2d3e3b4f011 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df8f37da65193dd384a4ea577f4f18bc08c3ccbd6e2a38e143a6832edb691139 +size 51395362 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..586b38c76ae29ff6b4e7c03d96c3f816916afcff --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d45ffe425b7e837a9796ed299e3f225ab8bc5d24e21fc14425cd7d1c3e2623c0 +size 51395426 diff --git a/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e1c89fb6311642d60068488ebe642faccc8022cc --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b58ab2e30c9dedb0edf0566f6c5ab492f802ba56e7add14db811f0b8dbd98c0 +size 51395479 diff --git a/1b121b21bc4seed1/global_step39672/layer_01-model_00-model_states.pt b/1b121b21bc4seed1/global_step39672/layer_01-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..af58647635a275e2efa8f40cf9526aeb0e870d86 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/layer_01-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc1551c16bb30efbf31583627bb7759e1d65fc8fc3c20e3ec128d083925ffa11 +size 187630851 diff --git a/1b121b21bc4seed1/global_step39672/layer_03-model_00-model_states.pt b/1b121b21bc4seed1/global_step39672/layer_03-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b5d9cdd9ebbe0d07b57589fdf1632b6585b11df9 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/layer_03-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92733ea75db4cdaa6a7dac8bd2e309d355b98ccbcfc886960ad78ec6bc315598 +size 77121283 diff --git a/1b121b21bc4seed1/global_step39672/layer_04-model_00-model_states.pt b/1b121b21bc4seed1/global_step39672/layer_04-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..95254bc086daf8c7e489e6548aada8629825fadd --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/layer_04-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a94192095be5e3bd57c066cd8dab02b2e0d141aad22694cfd2164c111a7f017e +size 77121283 diff --git a/1b121b21bc4seed1/global_step39672/layer_05-model_00-model_states.pt b/1b121b21bc4seed1/global_step39672/layer_05-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..65db0d9cb74a39102fe8c7ce3660645b3544dc5c --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/layer_05-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b63e738f4f35fbfa23871e8c3178be3d585d99ac9dd30f9233fd7695ed6eec7 +size 77121283 diff --git a/1b121b21bc4seed1/global_step39672/layer_06-model_00-model_states.pt b/1b121b21bc4seed1/global_step39672/layer_06-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..77c1966a39f71d414d6cda26c11db7fde26542b6 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/layer_06-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b9b8a91fd4fde0584cd16305be350b11697e1e3fbea076682b4e98bd833768c +size 77121283 diff --git a/1b121b21bc4seed1/global_step39672/layer_07-model_00-model_states.pt b/1b121b21bc4seed1/global_step39672/layer_07-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b07b7709484b165b52ae5d772faed89d28aa21b9 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/layer_07-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4d17c65778f22813242006b12a2b6031fb12703bab3d21e1162997ccec23e4f +size 77121283 diff --git a/1b121b21bc4seed1/global_step39672/layer_08-model_00-model_states.pt b/1b121b21bc4seed1/global_step39672/layer_08-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..59bd1d6da1d46b44b2bcd966d70535244ff68bab --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/layer_08-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ff8adb9abac78ce570813d77531c780384178b9f2379a6f0c3313733d198c7a +size 77121283 diff --git a/1b121b21bc4seed1/global_step39672/layer_09-model_00-model_states.pt b/1b121b21bc4seed1/global_step39672/layer_09-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..85360ac7ef8d96e2dcdbbc1991a39a84abfb67ef --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/layer_09-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2f895c4d3c5157540ab59a85db8e175c8ea9bebdd223ab55c7793e58b082756 +size 77121283 diff --git a/1b121b21bc4seed1/global_step39672/layer_10-model_00-model_states.pt b/1b121b21bc4seed1/global_step39672/layer_10-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..80d2ee69e8f0573221dea64f3c36381a42efc54b --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/layer_10-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b98d56842f1b4f98781802754d1c380a71e76230ba9202719af7c7f1d7ead0d +size 77121283 diff --git a/1b121b21bc4seed1/global_step39672/layer_11-model_00-model_states.pt b/1b121b21bc4seed1/global_step39672/layer_11-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9558419fa768815f1e1c28e461d0c18da50366a6 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/layer_11-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0c4560d6826491a7ab1ce7a4b466f3aa3f61843fc963a2a8d6487900b73a487 +size 77121283 diff --git a/1b121b21bc4seed1/global_step39672/layer_12-model_00-model_states.pt b/1b121b21bc4seed1/global_step39672/layer_12-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a578a4d97b30f36637e69ecf12d30bec317c77d --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/layer_12-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc11fb5ca2d52ee78212a3f72c4fd0c1d6920f178d9eb97f5a0a6515120989e8 +size 77121283 diff --git a/1b121b21bc4seed1/global_step39672/layer_13-model_00-model_states.pt b/1b121b21bc4seed1/global_step39672/layer_13-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..92626133af0d2046814ab9acfd511f2b7e154862 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/layer_13-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77fce7d48b7bce06d70a5539f4d8f61da7a187a2872c219613d94afa29c9e58e +size 77121283 diff --git a/1b121b21bc4seed1/global_step39672/layer_14-model_00-model_states.pt b/1b121b21bc4seed1/global_step39672/layer_14-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a0ad3f76a6610e2925dbd21451b2c697af84a3e --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/layer_14-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69fc23c3c5e8dde5805b46ca806ee2a419311c241270d783202d8fa3bb350391 +size 77121283 diff --git a/1b121b21bc4seed1/global_step39672/layer_15-model_00-model_states.pt b/1b121b21bc4seed1/global_step39672/layer_15-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..67128945bcc6537eb73cc3cea5b6d08e84023099 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/layer_15-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39871f6aec6831002dfcdc1b069769554dd9bbbe6f33ca5aeba5441ec900b55a +size 77121283 diff --git a/1b121b21bc4seed1/global_step39672/layer_16-model_00-model_states.pt b/1b121b21bc4seed1/global_step39672/layer_16-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..08a8d9c63c64fabce257b26029889b3f5a3e4ecb --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/layer_16-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c5b83f4dfdac605a52d5917f1a1f278ccfff85873e71ab147ba8d48c59354ef +size 77121283 diff --git a/1b121b21bc4seed1/global_step39672/layer_17-model_00-model_states.pt b/1b121b21bc4seed1/global_step39672/layer_17-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..80d0a60cf8886025128a40a8b155937fc88e8a0b --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/layer_17-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c267a8e4fb21f8318c3839b4a9a20ba29ef4d44fb88884fe6d9eadf4723977a3 +size 77121283 diff --git a/1b121b21bc4seed1/global_step39672/layer_18-model_00-model_states.pt b/1b121b21bc4seed1/global_step39672/layer_18-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a3e9c4a9ee6d55bae732d1e4b667ca0fe6953de --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/layer_18-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3f21cfef3a649cae6ecea436b9abbf26a57f227f804eeb40519647b36271b63 +size 77121283 diff --git a/1b121b21bc4seed1/global_step39672/layer_19-model_00-model_states.pt b/1b121b21bc4seed1/global_step39672/layer_19-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..99f082ea8cbc2094c51b111463e8d0d42eb76d45 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/layer_19-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55e97d21bbb059eecf59553f4dc4365e1bd04c417bf22d0532af07d0c9948554 +size 77121283 diff --git a/1b121b21bc4seed1/global_step39672/layer_20-model_00-model_states.pt b/1b121b21bc4seed1/global_step39672/layer_20-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f6af1c9d02c68640277e7080248800ac474072c7 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/layer_20-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4588f5c3d1a407460935d7f3a8aaeb739604271bd87e916ab1f832b332e6b58f +size 77121283 diff --git a/1b121b21bc4seed1/global_step39672/layer_21-model_00-model_states.pt b/1b121b21bc4seed1/global_step39672/layer_21-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fdb34ebb662c806eb4a748a8d0e7423c8e8394db --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/layer_21-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f92884679adac529e012cecd603e6c8246409039516ff004c64e83d1e2fc5de +size 77121283 diff --git a/1b121b21bc4seed1/global_step39672/layer_22-model_00-model_states.pt b/1b121b21bc4seed1/global_step39672/layer_22-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d75eb55839382a9b594721ef8a505806aab30e14 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/layer_22-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:652e79bdf1b7ee18508f543b8575615b7eee8f00510d6d22c88c8808612168f9 +size 77121283 diff --git a/1b121b21bc4seed1/global_step39672/layer_23-model_00-model_states.pt b/1b121b21bc4seed1/global_step39672/layer_23-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f58654e5ffaa85ab865509904d78b3cc9c2e72b --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/layer_23-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10f77fceb380e3f2fdac3d1cbfe28ace113e49634e29167c31ab492ad85cea5f +size 77121283 diff --git a/1b121b21bc4seed1/global_step39672/layer_24-model_00-model_states.pt b/1b121b21bc4seed1/global_step39672/layer_24-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e640216c7ae17c812040204c01d7e966fc8fd957 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/layer_24-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26eebc9a8338340e224624bbfa96556268dd99cf039d3e893412e9e795b6c61f +size 77121283 diff --git a/1b121b21bc4seed1/global_step39672/layer_25-model_00-model_states.pt b/1b121b21bc4seed1/global_step39672/layer_25-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f931aba2bb653cbeb85bf0e3643e7301a406f0a --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/layer_25-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:019791639e11d378756de1fbcf7418024fdd4085d28fe0c1b944b1edd1f70604 +size 77121283 diff --git a/1b121b21bc4seed1/global_step39672/layer_26-model_00-model_states.pt b/1b121b21bc4seed1/global_step39672/layer_26-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..173bc6237bc19dcea1064bf41f2b53316f149667 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/layer_26-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6376d69bc60f4e95b5f7ca97fef01cdcc58aae633874653c8cb6537d4d6f3ef1 +size 77121283 diff --git a/1b121b21bc4seed1/global_step39672/layer_27-model_00-model_states.pt b/1b121b21bc4seed1/global_step39672/layer_27-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..35cd50ff3d51bbb78c7614aa1879314d127f0b3c --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/layer_27-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:284801ec5ca98aba27b73c0cba5064ad8904566d9e1f67eded8c142bed9ca319 +size 77121283 diff --git a/1b121b21bc4seed1/global_step39672/layer_28-model_00-model_states.pt b/1b121b21bc4seed1/global_step39672/layer_28-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..03d3a8d58c4f013d55fbb9cc955840cbc518eedf --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/layer_28-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f5beb4111d47a241b716256cc97551dac4ffeb3ec3f5cbb6aaba322f83f6625 +size 77121283 diff --git a/1b121b21bc4seed1/global_step39672/layer_30-model_00-model_states.pt b/1b121b21bc4seed1/global_step39672/layer_30-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6bc6513599566dce1698271c4e0665594563885a --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/layer_30-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:431c535f010c326f7ac95e91725ec7516f670292ce48284664d89705ac260443 +size 8387 diff --git a/1b121b21bc4seed1/global_step39672/mp_rank_00_model_states.pt b/1b121b21bc4seed1/global_step39672/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b095ac823fe683ae4fae95eca4e7a068d94832f9 --- /dev/null +++ b/1b121b21bc4seed1/global_step39672/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:79017efc1dbc98681caee2c2dbf5aad92ad7ba4b3175fa4836317290fbe1b215 +size 43827 diff --git a/1b121b21bc4seed1/transformers/config.json b/1b121b21bc4seed1/transformers/config.json new file mode 100644 index 0000000000000000000000000000000000000000..7120acb75187622c061f0425674b658dd9155502 --- /dev/null +++ b/1b121b21bc4seed1/transformers/config.json @@ -0,0 +1 @@ +{"vocab_size": 50304, "n_positions": 2048, "n_embd": 1792, "n_layer": 26, "n_head": 14, "n_inner": 7168, "activation_function": "gelu", "resid_pdrop": 0.1, "embd_pdrop": 0.1, "attn_pdrop": 0.1, "layer_norm_epsilon": 1e-05, "initializer_range": 0.02, "summary_type": "cls_index", "summary_use_proj": true, "summary_activation": null, "summary_first_dropout": 0.1, "summary_proj_to_labels": true, "scale_attn_weights": true, "use_cache": true, "scale_attn_by_inverse_layer_idx": false, "reorder_and_upcast_attn": false, "bos_token_id": 50256, "eos_token_id": 50256, "return_dict": true, "output_hidden_states": false, "output_attentions": false, "torchscript": false, "torch_dtype": null, "use_bfloat16": false, "tf_legacy_loss": false, "pruned_heads": {}, "tie_word_embeddings": true, "is_encoder_decoder": false, "is_decoder": false, "cross_attention_hidden_size": null, "add_cross_attention": false, "tie_encoder_decoder": false, "max_length": 20, "min_length": 0, "do_sample": false, "early_stopping": false, "num_beams": 1, "num_beam_groups": 1, "diversity_penalty": 0.0, "temperature": 1.0, "top_k": 50, "top_p": 1.0, "typical_p": 1.0, "repetition_penalty": 1.0, "length_penalty": 1.0, "no_repeat_ngram_size": 0, "encoder_no_repeat_ngram_size": 0, "bad_words_ids": null, "num_return_sequences": 1, "chunk_size_feed_forward": 0, "output_scores": false, "return_dict_in_generate": false, "forced_bos_token_id": null, "forced_eos_token_id": null, "remove_invalid_values": false, "exponential_decay_length_penalty": null, "suppress_tokens": null, "begin_suppress_tokens": null, "architectures": ["GPT2LMHeadModel"], "finetuning_task": null, "id2label": {"0": "LABEL_0", "1": "LABEL_1"}, "label2id": {"LABEL_0": 0, "LABEL_1": 1}, "tokenizer_class": null, "prefix": null, "pad_token_id": null, "sep_token_id": null, "decoder_start_token_id": null, "task_specific_params": null, "problem_type": null, "_name_or_path": "", "transformers_version": "4.25.0.dev0", "n_ctx": 1024, "gradient_checkpointing": false, "model_type": "gpt2"} \ No newline at end of file diff --git a/1b121b21bc4seed1/transformers/pytorch_model.bin b/1b121b21bc4seed1/transformers/pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..32a012ca0bcdef2a0ce5d800a5f9437b141bb20f --- /dev/null +++ b/1b121b21bc4seed1/transformers/pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:908ab4297936164e84df1dceaaa4a4a1d1e235d1d9cb3863e02cd4db3b0337d4 +size 2410895501 diff --git a/1b121b21bc4seed2/evaluation/generation/agg.1b121b21bc4seed2_GEM-web_nlg_en_PALM_prompt_0.json b/1b121b21bc4seed2/evaluation/generation/agg.1b121b21bc4seed2_GEM-web_nlg_en_PALM_prompt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..43aeffb512637a1f0cefd6ddf5aef54f947573b4 --- /dev/null +++ b/1b121b21bc4seed2/evaluation/generation/agg.1b121b21bc4seed2_GEM-web_nlg_en_PALM_prompt_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.2850756553878694, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.029479244787540198}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.06307795392559021, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0018961573476995012}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.2519437334576553, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0046233665666279115}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.09250286063498843, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0021321582297043904}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.031169579486007647, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0013315121763508673}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.12406823641780289, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003056908408498049}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.044919822948790884, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0013419119538143087}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.060512962960882884, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0017532071667563402}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.24591537295391636, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004506544617650046}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.08915644889918124, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0019635255248017934}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.060137684271610675, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0017836800848927256}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.24092589731633912, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004306266650112688}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.0881964727255614, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.00197619826433602}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/1b121b21bc4seed2/evaluation/generation/agg.1b121b21bc4seed2_GEM-web_nlg_en_PALM_prompt_1.json b/1b121b21bc4seed2/evaluation/generation/agg.1b121b21bc4seed2_GEM-web_nlg_en_PALM_prompt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..1d1e0cd304bd6cec353be7759b24442743baaa8f --- /dev/null +++ b/1b121b21bc4seed2/evaluation/generation/agg.1b121b21bc4seed2_GEM-web_nlg_en_PALM_prompt_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.24801641089701984, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.011989470193668068}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.05818517766037036, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0014819995423263183}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.2827362020383282, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.00480569342082808}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.08959675554256848, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0018375399876627346}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.02635367956564326, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0009528048262941789}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.12704223429697128, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0030597437559013066}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.04016977243576677, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0011455508827807554}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.05484150466192377, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001315703805718461}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.2667301815318325, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004372221951900707}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.08471881476079753, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0016703735129750064}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.055740125805322414, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0014190378903881072}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.26919922518521233, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004429470047755656}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.08576130624221133, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0017402119865819162}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/1b121b21bc4seed2/evaluation/generation/agg.1b121b21bc4seed2_GEM-web_nlg_en_PALM_prompt_2.json b/1b121b21bc4seed2/evaluation/generation/agg.1b121b21bc4seed2_GEM-web_nlg_en_PALM_prompt_2.json new file mode 100644 index 0000000000000000000000000000000000000000..c4ea9b7dacc13f469fb1e0d17af2d0fd11d754bd --- /dev/null +++ b/1b121b21bc4seed2/evaluation/generation/agg.1b121b21bc4seed2_GEM-web_nlg_en_PALM_prompt_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.2530185878500052, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.012040289243788763}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.058512763074349945, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.001317655981799918}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.28742836834463886, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004669386290992104}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.09138094990191768, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.001796675120671757}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.02660128395309018, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007990003962669926}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.13371012137028607, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003130626897597201}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.041518797800848606, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0011144817093188633}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.05542859482898103, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0011932242274819006}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.2719360787885418, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0042608863041157016}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.08671939835151828, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0016448408963673205}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.056182111716967645, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.001251228891614172}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.2754066562262308, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004372289191944523}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.08775702388632066, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0017074743673142906}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/1b121b21bc4seed2/evaluation/generation/agg.1b121b21bc4seed2_GEM-web_nlg_en_PALM_prompt_3.json b/1b121b21bc4seed2/evaluation/generation/agg.1b121b21bc4seed2_GEM-web_nlg_en_PALM_prompt_3.json new file mode 100644 index 0000000000000000000000000000000000000000..a382551f419e10746c90a0ba3c93e5775831d825 --- /dev/null +++ b/1b121b21bc4seed2/evaluation/generation/agg.1b121b21bc4seed2_GEM-web_nlg_en_PALM_prompt_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.26104356935100076, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.020606892130089625}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.05876875730987439, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.001262923124165934}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.2978570511134094, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004772108557819704}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.09225925338125805, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0017393497174197025}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.026266986693919324, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007684696212875827}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.13694139873828265, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0032263532566755484}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.041225163728007774, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0010870715838513074}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.05552067895103241, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0011567152896671338}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.27953358851668986, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004336840965548908}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.08719695353070112, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0016039844889244289}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.05648619086001838, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.001210169007089921}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.28427881728747934, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004454752297972069}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.08861162982557379, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016648356514252724}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/1b121b21bc4seed2/evaluation/generation/agg.1b121b21bc4seed2_GEM-web_nlg_en_PALM_prompt_4.json b/1b121b21bc4seed2/evaluation/generation/agg.1b121b21bc4seed2_GEM-web_nlg_en_PALM_prompt_4.json new file mode 100644 index 0000000000000000000000000000000000000000..dad22c9de0cc51807bc7bd712740bceff7b11510 --- /dev/null +++ b/1b121b21bc4seed2/evaluation/generation/agg.1b121b21bc4seed2_GEM-web_nlg_en_PALM_prompt_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.29578242700897045, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.01644855391604288}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.059241759487365105, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0013185605514960156}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.2941689602060997, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004782582061622861}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.09236209607564469, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0017155296399348975}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.026700072260856023, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0008329146326999274}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.13703029324122062, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0032032363310221562}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.04146292001846389, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0010710528467515177}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.05584064201532722, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0011822227694518028}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.2765136016304282, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004355885247911899}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.0871975029360322, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0015832095836349604}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.056809260000044604, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0012651199781666866}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.28080366233461934, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004447560399921803}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.08849785197136012, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.001631762057927943}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/1b121b21bc4seed2/evaluation/generation/agg.1b121b21bc4seed2_GEM-web_nlg_en_PALM_prompt_5.json b/1b121b21bc4seed2/evaluation/generation/agg.1b121b21bc4seed2_GEM-web_nlg_en_PALM_prompt_5.json new file mode 100644 index 0000000000000000000000000000000000000000..0f2851b7de52553a769ef4de0a4b0767ef738a36 --- /dev/null +++ b/1b121b21bc4seed2/evaluation/generation/agg.1b121b21bc4seed2_GEM-web_nlg_en_PALM_prompt_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.3072581712947307, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.013011180740751221}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.05956004848850282, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0011844820103012758}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.3050141575766028, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004806860152049065}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.09385006352878718, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0016492746708198635}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.02671744686752806, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007193199514761142}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.1433762159365779, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003204965724880526}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.04219069561770858, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0010275629961263655}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.056371808160412054, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0011227434161722896}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.28550365697556257, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004319358585933794}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.08869899339649662, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0015565597321756607}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.057099278638911184, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.001138102224001842}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.2910079263017007, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0044961239015304435}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.08990792464666136, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0015790820849768395}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/1b121b21bc4seed2/evaluation/generation/agg.1b121b21bc4seed2_GEM-wiki_lingua_en_tldr_en_0.json b/1b121b21bc4seed2/evaluation/generation/agg.1b121b21bc4seed2_GEM-wiki_lingua_en_tldr_en_0.json new file mode 100644 index 0000000000000000000000000000000000000000..3749eba3f2eb84611fa4c30b2a2be167a6428922 --- /dev/null +++ b/1b121b21bc4seed2/evaluation/generation/agg.1b121b21bc4seed2_GEM-wiki_lingua_en_tldr_en_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.13418128757490422, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0019073144542996227}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.22370464176226834, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002611499109099858}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.1561377606426544, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0018912371468179697}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.025327472863282418, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007106910143569577}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.04305842511949861, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0012262998119789712}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.029464599857488446, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0007789826555536276}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.10545228491836044, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001352449912251029}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.1823578443380979, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002113773481771066}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.12424387461861276, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.00136977188181699}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.12317282152669443, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.001738142219855923}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.20632202845312703, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002412292367994964}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.143508075517125, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0017239605017566344}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 1.321761515529462, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.06405890291232123}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/1b121b21bc4seed2/evaluation/generation/agg.1b121b21bc4seed2_GEM-wiki_lingua_en_tldr_en_1.json b/1b121b21bc4seed2/evaluation/generation/agg.1b121b21bc4seed2_GEM-wiki_lingua_en_tldr_en_1.json new file mode 100644 index 0000000000000000000000000000000000000000..1964f2ffec31c1388c625e9873ba0a641b4fa50d --- /dev/null +++ b/1b121b21bc4seed2/evaluation/generation/agg.1b121b21bc4seed2_GEM-wiki_lingua_en_tldr_en_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.14320491367082974, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0017845301991567476}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.24137867619505146, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0025607829167710225}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.16584774157614826, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.00170618534117368}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.024138151973368126, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0006642056284954163}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.04339348127802618, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0013577106434495858}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.028239833468568194, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.000742179114763329}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.10239786671559123, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0011893616487463725}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.17945313333907692, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.001974005906098066}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.1198532739033359, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001127314183736604}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.1340667845076243, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.001657309035299111}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.2269067249445735, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0024213993165733594}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.15540160642759504, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0015831136631871156}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 1.3666198009021433, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.02548342731902}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/1b121b21bc4seed2/evaluation/generation/agg.1b121b21bc4seed2_GEM-wiki_lingua_en_tldr_en_2.json b/1b121b21bc4seed2/evaluation/generation/agg.1b121b21bc4seed2_GEM-wiki_lingua_en_tldr_en_2.json new file mode 100644 index 0000000000000000000000000000000000000000..d381c02faafed5edcf4c832acdee9e9760e93ae0 --- /dev/null +++ b/1b121b21bc4seed2/evaluation/generation/agg.1b121b21bc4seed2_GEM-wiki_lingua_en_tldr_en_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.1458694998331044, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0020751465219441393}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.23221929546910855, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0024940559594616818}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.16273042831855172, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.001775802427873928}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.026699811383133716, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0009124914873931906}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.04136532269717438, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0011921194612908434}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.028547689348404154, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0007464823189898568}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.10982415140479714, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0015215433681870106}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.18026503948966904, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0019465654580408404}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.12326647530268532, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0012253014530928786}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.13660282396539003, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0019561376555209675}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.21773728025312808, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0023396514300470118}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.15222819626322362, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016446268586332612}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 1.330687803868559, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.05809493878615601}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/1b121b21bc4seed2/evaluation/generation/agg.1b121b21bc4seed2_GEM-wiki_lingua_en_tldr_en_3.json b/1b121b21bc4seed2/evaluation/generation/agg.1b121b21bc4seed2_GEM-wiki_lingua_en_tldr_en_3.json new file mode 100644 index 0000000000000000000000000000000000000000..25bd6decc04599387038e24f0e72064875ffaab8 --- /dev/null +++ b/1b121b21bc4seed2/evaluation/generation/agg.1b121b21bc4seed2_GEM-wiki_lingua_en_tldr_en_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.1301446922879572, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0023453140077651403}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.192560590973123, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002831737470965657}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.13727972794632332, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.001966418255252875}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.024524184294746752, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0009475897993583641}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.036259772750247096, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0012047403068686847}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.025265129695390083, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0007420512125640625}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.10008927585037762, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0017992649861688023}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.1516749369666555, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0022484203739687827}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.10580900761306217, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001429843686104546}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.12168486458438436, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.002209541457640191}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.18040752843563596, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0026623601517320387}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.12824788953769048, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0018235330304926663}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 1.4859120479096923, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.05574241192906709}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/1b121b21bc4seed2/evaluation/generation/agg.1b121b21bc4seed2_GEM-wiki_lingua_en_tldr_en_4.json b/1b121b21bc4seed2/evaluation/generation/agg.1b121b21bc4seed2_GEM-wiki_lingua_en_tldr_en_4.json new file mode 100644 index 0000000000000000000000000000000000000000..c2bbd2da0d8fb66726babf2e37a426ea8934ce22 --- /dev/null +++ b/1b121b21bc4seed2/evaluation/generation/agg.1b121b21bc4seed2_GEM-wiki_lingua_en_tldr_en_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.04687267447236592, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0018998335960580418}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.07098562737132999, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0025626429489145814}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.0482938559604652, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0017050539428373885}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.00945752327909291, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0006557120452244116}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.01524147181315175, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.000968063791685238}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.00992332936384645, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0005483941828877055}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.03658048025111141, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0014765804478846238}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.056879968483736575, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0020708799931085835}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.03777472015184596, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0012944979133275166}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.04364094827472193, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0017744092995215651}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.06599052444685644, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0023914383468420387}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.04480769496337831, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0015770553891978325}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 0.38983093510263966, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.020746959439040737}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/1b121b21bc4seed2/evaluation/generation/agg.1b121b21bc4seed2_GEM-wiki_lingua_en_tldr_en_5.json b/1b121b21bc4seed2/evaluation/generation/agg.1b121b21bc4seed2_GEM-wiki_lingua_en_tldr_en_5.json new file mode 100644 index 0000000000000000000000000000000000000000..346aa84ceff4ccd96c83d7ccd4ffb6c2a11cd152 --- /dev/null +++ b/1b121b21bc4seed2/evaluation/generation/agg.1b121b21bc4seed2_GEM-wiki_lingua_en_tldr_en_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.007899778364305632, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0008374134090368952}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.011343564720969444, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0011277127148891929}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.007816345912784222, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0007612291694346548}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.0016948351052204623, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.00025208432207753475}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.002630687274039701, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0004138243186705428}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.0017575740188721435, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.00024992892095104455}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.006320389859749812, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0006593125172728464}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.009415721615635371, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0009461004389786301}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.006339645540807284, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0006142715904854269}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.007348127779079044, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0007820257098133964}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.01039809783113184, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0010181220364392032}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.007195583841595385, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0006939813114362923}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 6.848753994158733e-07, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 1.2091205071113564e-06}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/1b121b21bc4seed2/evaluation/generation/agg.1b121b21bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_0.json b/1b121b21bc4seed2/evaluation/generation/agg.1b121b21bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..d4ff1a10a53d5222172bf8d968d2b194e20ebddf --- /dev/null +++ b/1b121b21bc4seed2/evaluation/generation/agg.1b121b21bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 0.008438122208283742, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.001197050519804994}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.01731813417190785, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0006904015455150221}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.008140031462486316, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0003341464417431424}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.010852991398846181, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.00043603376914659093}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.0, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.0, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.0, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.016290356394130068, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0006344252881163902}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.0076944580577918845, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.00031179286190496404}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.010236948851681334, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.00040376061853106}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.017040356394130075, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0006757816435795186}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.008014275466220572, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0003277471469197949}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.010681172391084869, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0004270222110231445}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/1b121b21bc4seed2/evaluation/generation/agg.1b121b21bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_1.json b/1b121b21bc4seed2/evaluation/generation/agg.1b121b21bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_1.json new file mode 100644 index 0000000000000000000000000000000000000000..5bbb74be81c1b762c2b7c806c2582d08b38a8595 --- /dev/null +++ b/1b121b21bc4seed2/evaluation/generation/agg.1b121b21bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 5.415302314455357, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.08866274485975845}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.27518284278158495, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0026904123485453207}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.44395987313972773, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002853052677955519}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.31351772873404504, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0019155579544317606}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.11779839983589596, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0022522445004712227}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.184152221066327, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002022505610836659}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.1270592371269382, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0013298949590436037}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.2142971565592026, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0023228065282473727}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3473102442580568, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0023084199885264082}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.24261441305411593, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0013732549831421876}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.23044400536893825, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0025590767181566617}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3694044441017418, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0026884487723429907}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.2604729426900251, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.001783692486265605}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/1b121b21bc4seed2/evaluation/generation/agg.1b121b21bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_2.json b/1b121b21bc4seed2/evaluation/generation/agg.1b121b21bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_2.json new file mode 100644 index 0000000000000000000000000000000000000000..19f38dba497ec392abf705e558f6d737a4f24cb9 --- /dev/null +++ b/1b121b21bc4seed2/evaluation/generation/agg.1b121b21bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 6.0835515625006265, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.13104580918021916}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.2974677905788029, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0027133762420868996}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.46824453868512245, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0027816673096099764}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.33900310160818814, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.001977319155178536}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.12852946982374805, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.001751970024964452}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.2045106938957861, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002085524555577239}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.14523171565764664, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0014456847848380934}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.22768892967881724, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002087880547521337}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.36418502101759054, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002325817522071071}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.26089415735825394, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0015092210279407214}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.2475565846991815, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0024501420067594773}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3901821108140583, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002708125972473242}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.2819640732417153, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0019029624581531216}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/1b121b21bc4seed2/evaluation/generation/agg.1b121b21bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_3.json b/1b121b21bc4seed2/evaluation/generation/agg.1b121b21bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_3.json new file mode 100644 index 0000000000000000000000000000000000000000..ddcbaceefeb1a7a9cda9bad13cd3af284ca80e89 --- /dev/null +++ b/1b121b21bc4seed2/evaluation/generation/agg.1b121b21bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 6.191081522703311, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.08272180666976954}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.3059304522321104, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0027936595692492597}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4706742638622414, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0027940064831602895}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.34451701581346555, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0019917632496230047}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.13437401439677085, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0017741938204701253}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.2092379893021306, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002098339038549269}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.15040030282166134, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0014742918695484102}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.23044883331819338, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0021248657249371234}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.360559914434991, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0023451576403232576}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.26101746069946474, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.00152874420852884}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.2535539353339795, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.002458411594898136}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3921926325740904, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002706349636318779}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.28608327236106273, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0018907928361422866}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/1b121b21bc4seed2/evaluation/generation/agg.1b121b21bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_4.json b/1b121b21bc4seed2/evaluation/generation/agg.1b121b21bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_4.json new file mode 100644 index 0000000000000000000000000000000000000000..9b43ab44450efd9c857fcc2579145841329ba4a1 --- /dev/null +++ b/1b121b21bc4seed2/evaluation/generation/agg.1b121b21bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 6.111226061397375, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.09062441129980986}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.30328161795682607, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002708454817254866}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4688958080821436, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002671021101118256}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.34431019911907407, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0019747182058236588}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.13386033868102898, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.001714165558168862}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.2086704107913658, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0020408838673953386}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.15099725848090637, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0014686203885590958}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.22638671811775446, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0020039774183955566}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.35756636848528994, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002297633308443435}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.2590550585031971, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001502995830389098}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.2504271029683134, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0023554702511328304}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.39039800395209395, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002657711797112865}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.2853836607666494, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.001891594019521224}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/1b121b21bc4seed2/evaluation/generation/agg.1b121b21bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_5.json b/1b121b21bc4seed2/evaluation/generation/agg.1b121b21bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_5.json new file mode 100644 index 0000000000000000000000000000000000000000..5d25939eb68e18f9cd0597d2eb1e046e837615c3 --- /dev/null +++ b/1b121b21bc4seed2/evaluation/generation/agg.1b121b21bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 6.157356980483942, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.07864334022914665}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.30466283281999534, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0025978328638333616}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4773039407134765, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002664398147764323}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.35051512109030886, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0019782779391466078}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.13400973384465575, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0016288510201777058}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.21289488423428288, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002000085706195211}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.15368403663923805, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0014239556304565032}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.22385070378222516, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0019273938628042813}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3574082439802802, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002275515159936868}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.25918799434536877, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0015032561739134625}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.2535442923717527, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0022917134606788734}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.39929532049271077, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002600651131060951}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.2922680755704595, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0018749054110706917}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/1b121b21bc4seed2/evaluation/generation/agg.1b121b21bc4seed2_gem_xsum_article_DOC_summary_0.json b/1b121b21bc4seed2/evaluation/generation/agg.1b121b21bc4seed2_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..7975631db45b436b2ea0d76326c47b15ff08d5ee --- /dev/null +++ b/1b121b21bc4seed2/evaluation/generation/agg.1b121b21bc4seed2_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.13501905286560467, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0017190548809381608}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.3283241072423947, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0038525710180174508}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.18901821549901887, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002279829129106952}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.02615731107536162, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0008966873086018211}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.06575913031162332, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002266591287149122}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.03695459182313156, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0012557792366904089}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.1027427586819049, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001244941572662973}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.252046388299858, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002947806442204036}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.14412588822347172, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0016582568651692159}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.10624155578857983, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.001424582628324823}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.26000319990620885, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0033470003654420873}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.14899415385858006, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0019181750290880519}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.3129317790470016, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.07760065268118045}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/1b121b21bc4seed2/evaluation/generation/agg.1b121b21bc4seed2_gem_xsum_article_DOC_summary_1.json b/1b121b21bc4seed2/evaluation/generation/agg.1b121b21bc4seed2_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..562987ee8a1e6d669a0394101fcdabb80c34caa9 --- /dev/null +++ b/1b121b21bc4seed2/evaluation/generation/agg.1b121b21bc4seed2_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.10785786524836369, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.00166393179985334}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.26764764317740486, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.003811737165493939}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.15187372372759875, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002238363045234264}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.016853649910436037, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007934380254041366}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.04266671919641135, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0020332253461267506}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.023861206597580405, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0011166771493325116}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.0850737564631199, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001231208254663744}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.21291139183497299, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0029192691827101673}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.12003447267920726, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0016620315126572962}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.08614064999564035, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0013137573398773557}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.21627422684982414, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0031741815045650216}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.12165528120740891, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.001786850495717495}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 0.9224414632472534, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.08019869073111606}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/1b121b21bc4seed2/evaluation/generation/agg.1b121b21bc4seed2_gem_xsum_article_DOC_summary_2.json b/1b121b21bc4seed2/evaluation/generation/agg.1b121b21bc4seed2_gem_xsum_article_DOC_summary_2.json new file mode 100644 index 0000000000000000000000000000000000000000..2faa432f2818e7b7c94780dfb522225b0e4941eb --- /dev/null +++ b/1b121b21bc4seed2/evaluation/generation/agg.1b121b21bc4seed2_gem_xsum_article_DOC_summary_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.1062226714370173, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0016313647653793566}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.2649518628728813, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.003652381902131823}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.14992707811107275, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0021846261144537115}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.01588044344088591, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007537881734122496}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.04053986486635946, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0019391443831652793}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.022554691732547677, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0010629952996922107}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.08432740681651495, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0011919454883656977}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.21219568397714195, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.00280778428980714}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.11929556728475006, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0016092633921978442}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.08362060554920302, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0012757122592231506}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.21114568653248753, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.003020669313336447}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.11841507440799803, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0017311352559642463}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 0.7849705282265558, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.05021581187998352}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/1b121b21bc4seed2/evaluation/generation/agg.1b121b21bc4seed2_gem_xsum_article_DOC_summary_3.json b/1b121b21bc4seed2/evaluation/generation/agg.1b121b21bc4seed2_gem_xsum_article_DOC_summary_3.json new file mode 100644 index 0000000000000000000000000000000000000000..a8dad4f5fa7ad152b5198c68b8ef950b466a19e3 --- /dev/null +++ b/1b121b21bc4seed2/evaluation/generation/agg.1b121b21bc4seed2_gem_xsum_article_DOC_summary_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.10057846011875604, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0018497294107205577}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.23942926779906215, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.003842497556321712}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.13810451001882001, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0022714225587039667}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.014408897494360922, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007527082518367464}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.035145702586454476, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0018205243537310583}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.019896507185675868, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0010117990051707437}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.08102526691338699, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0014626039759259395}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.19354330349683008, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0029953557840955284}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.11124617587091595, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0017443372993626053}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.0803671735666726, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0015024060943462886}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.1928976711119303, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.003150396864481297}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.11048932831500144, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0018170680342048896}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 0.7190258437509995, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.042187577531458346}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/1b121b21bc4seed2/evaluation/generation/agg.1b121b21bc4seed2_gem_xsum_article_DOC_summary_4.json b/1b121b21bc4seed2/evaluation/generation/agg.1b121b21bc4seed2_gem_xsum_article_DOC_summary_4.json new file mode 100644 index 0000000000000000000000000000000000000000..6bee75181788102bea44e090501553b28744835b --- /dev/null +++ b/1b121b21bc4seed2/evaluation/generation/agg.1b121b21bc4seed2_gem_xsum_article_DOC_summary_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.03173204900268027, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002027826208658339}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.05989088557122078, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0034559892001691417}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.03779629267333967, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002174444567033052}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.004425484224867963, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.000643504684134592}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.008676763065921654, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0009869539677775623}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.005239892494254664, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0005866501971322619}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.025562577011753043, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0016557292706477333}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.04810137820818986, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002762103216085477}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.030163301894705917, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0017082556309796733}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.026108776067360468, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0017169750619199886}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.04912097715557878, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002853073868806013}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.030777834462545225, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0017676759430837576}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 0.32351273593768703, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.08540381984004876}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/1b121b21bc4seed2/evaluation/generation/agg.1b121b21bc4seed2_gem_xsum_article_DOC_summary_5.json b/1b121b21bc4seed2/evaluation/generation/agg.1b121b21bc4seed2_gem_xsum_article_DOC_summary_5.json new file mode 100644 index 0000000000000000000000000000000000000000..7db34078faf202aa95391140cb59ed0ca133ab5e --- /dev/null +++ b/1b121b21bc4seed2/evaluation/generation/agg.1b121b21bc4seed2_gem_xsum_article_DOC_summary_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.0028066473138469166, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0008207012823296872}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.0020864639544280125, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0005806543667432164}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.002313684367811786, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0006507326736497126}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.00023749835070589783, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0001188407936767355}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.0001673483748955447, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 8.57618183045581e-05}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.00019304594776292888, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 9.705711124778186e-05}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.0019047789901811747, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0005159501799768975}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.0015276752695243573, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0004218946829627963}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.001631869743854381, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.00043610635442712287}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.002236816201562974, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0006238629929594013}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.0017355764056056515, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0004749539743411232}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.0018840090143813742, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0005098533594631085}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.0347712018500012e-39, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 1.5407113142608347e-34}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_GEM-web_nlg_en_PALM_prompt_0.jsonl b/1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_GEM-web_nlg_en_PALM_prompt_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..ca8a5e69264774f0ba2b3de720adef65eb00a7d6 --- /dev/null +++ b/1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_GEM-web_nlg_en_PALM_prompt_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a39bba0b67bb4a9f29c8cea0150fe39ef4f55ea9a334ee25c4b7a3a971c834eb +size 4182062 diff --git a/1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_GEM-web_nlg_en_PALM_prompt_1.jsonl b/1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_GEM-web_nlg_en_PALM_prompt_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..b988fb7ba9687468564fc174efe27deec2ee9c14 --- /dev/null +++ b/1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_GEM-web_nlg_en_PALM_prompt_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97a41c6a892430876e3296868e4bbf2db181e4a0462975c63ba61cb86d6dfe31 +size 5171912 diff --git a/1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_GEM-web_nlg_en_PALM_prompt_2.jsonl b/1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_GEM-web_nlg_en_PALM_prompt_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..479ccebb1587a25191f7d5488ef23083c1d50f44 --- /dev/null +++ b/1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_GEM-web_nlg_en_PALM_prompt_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:162d61d3a2df7de283deea9bcccd47db8b7d846d99114699bb9c6abcdc3aef44 +size 6067812 diff --git a/1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_GEM-web_nlg_en_PALM_prompt_3.jsonl b/1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_GEM-web_nlg_en_PALM_prompt_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..66de2a02af954999265499a3474564445d5ce2b3 --- /dev/null +++ b/1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_GEM-web_nlg_en_PALM_prompt_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0a4ec199df470ada4004c846f28fe14f24d070264c84fcba1eb3d818498e861 +size 6974955 diff --git a/1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_GEM-web_nlg_en_PALM_prompt_4.jsonl b/1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_GEM-web_nlg_en_PALM_prompt_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..4a39f2cf33091851cc77a5dfb458dac36d073443 --- /dev/null +++ b/1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_GEM-web_nlg_en_PALM_prompt_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af8db29c70d17978e3a66bcbf19e1ceb517f8220af0ae058ddc64291f49b1181 +size 7853913 diff --git a/1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_GEM-web_nlg_en_PALM_prompt_5.jsonl b/1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_GEM-web_nlg_en_PALM_prompt_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..25e049c72775392e36342d1502927024788c430a --- /dev/null +++ b/1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_GEM-web_nlg_en_PALM_prompt_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26b08f4ec2138cf169fdc8bdc31ada05163e5dada42ee05035fc7f336a721f5c +size 8763779 diff --git a/1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_GEM-wiki_lingua_en_tldr_en_0.jsonl b/1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_GEM-wiki_lingua_en_tldr_en_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e0c68ba929f0b4d1e94410c0d4601a7322ad3725 --- /dev/null +++ b/1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_GEM-wiki_lingua_en_tldr_en_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26868daca1fecba332241447c0bcdf3b728e8ae649de75c15eac1794978c5b02 +size 7676184 diff --git a/1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_GEM-wiki_lingua_en_tldr_en_1.jsonl b/1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_GEM-wiki_lingua_en_tldr_en_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..78a866c2c0e21dc73bbcb4c62c8e50c52a384796 --- /dev/null +++ b/1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_GEM-wiki_lingua_en_tldr_en_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ef41c443670d00f141b274114c4492238f07c192701078b89c489d1ca96a8a6 +size 13335183 diff --git a/1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_GEM-wiki_lingua_en_tldr_en_2.jsonl b/1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_GEM-wiki_lingua_en_tldr_en_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..8620c769f61f0900b6499bbcacd3f61784665f92 --- /dev/null +++ b/1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_GEM-wiki_lingua_en_tldr_en_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e5ef46ce8e42a64324298c1ffbf9a98bbefba121d60e366bb7b669b928df2ea +size 18920797 diff --git a/1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_GEM-wiki_lingua_en_tldr_en_3.jsonl b/1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_GEM-wiki_lingua_en_tldr_en_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e0d5b13d9c9d9023d17ce0cfe059e6cf8a6f1189 --- /dev/null +++ b/1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_GEM-wiki_lingua_en_tldr_en_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50e209a242525db3803d9bb2251a76ead4646890d2e174cf083a69565d96c95c +size 24331002 diff --git a/1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_GEM-wiki_lingua_en_tldr_en_4.jsonl b/1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_GEM-wiki_lingua_en_tldr_en_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..f43e504623c8aed3af5812cedc59238d40a1f781 --- /dev/null +++ b/1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_GEM-wiki_lingua_en_tldr_en_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf35bf043055b28d37b798f2b7c2667f4609744efa19a08f5a030507d7d1b6cb +size 29471521 diff --git a/1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_GEM-wiki_lingua_en_tldr_en_5.jsonl b/1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_GEM-wiki_lingua_en_tldr_en_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..5f6f54a9f8c9360c15ba8ff78c70b002cd469fe8 --- /dev/null +++ b/1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_GEM-wiki_lingua_en_tldr_en_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8afb1020f3640c933a81b4fe1e25d6839569afd8697ea6be709eac0ee4f5d91 +size 34799763 diff --git a/1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl b/1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..3f22044181b69c6f08ff917fad1e8be98892ee1f --- /dev/null +++ b/1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3856a7ca00ab60778cb270eb0fffdd055c5e51b5c7a683fc2861e2bffbbb0e71 +size 3788642 diff --git a/1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl b/1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..84ca6e98e6868837224cac3e6fa3faeb728cb27a --- /dev/null +++ b/1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0dbb4774f03a2d6576ae121830ec246451752a4d444649c4bf2bf2c5a145fee9 +size 5449866 diff --git a/1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl b/1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..fe21a7f0200163f778a2165fcbaf5c8211378aa0 --- /dev/null +++ b/1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef25a34e2d13019d4f93bd99900166e08f22917be1f85713f449c548007c5d7d +size 6516270 diff --git a/1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl b/1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..86917f3ab99768756541fe68ad8113ca714ab2a0 --- /dev/null +++ b/1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a86673ba460c2bcb01585e91fc05ac6e55a9d14dd439d3df35e32b0387b7a152 +size 7586916 diff --git a/1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl b/1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..4338eb1e0be7af33be85f921362f73cf4b4fd0bf --- /dev/null +++ b/1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90ccc856ef05bb10d40c02629ae15c256d28ad6ae54a5ffb8a25e777a1955901 +size 8668769 diff --git a/1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl b/1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e1b455aa9b549c63843e54e303286de9dde17f49 --- /dev/null +++ b/1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c369fb3554c709e23358357eb0029508c94092563b272f33c84d941fb9f8128e +size 9756444 diff --git a/1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_gem_xsum_article_DOC_summary_0.jsonl b/1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_gem_xsum_article_DOC_summary_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..7af6047f701d2827c31c94d801168f71630bd0f6 --- /dev/null +++ b/1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_gem_xsum_article_DOC_summary_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3accb7bdd25c7297f2e25d611e577235d357042b0d0289e7e77754400a77b353 +size 2837239 diff --git a/1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_gem_xsum_article_DOC_summary_1.jsonl b/1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_gem_xsum_article_DOC_summary_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..a7276535a4c2a57145a83243cfedf96c86a780a6 --- /dev/null +++ b/1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_gem_xsum_article_DOC_summary_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de61ec372f8af4fe62ae23729a6d3097145fcd2615316e8395304f9995efb647 +size 5104445 diff --git a/1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_gem_xsum_article_DOC_summary_2.jsonl b/1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_gem_xsum_article_DOC_summary_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..b4db0bee1aa14163424d3fb3d002106f857b8471 --- /dev/null +++ b/1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_gem_xsum_article_DOC_summary_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f2ee939e9ec84452c8e9aba9757aebf345808c0d7bf9bc4ebd67d4b7d83186d +size 7379892 diff --git a/1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_gem_xsum_article_DOC_summary_3.jsonl b/1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_gem_xsum_article_DOC_summary_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..798ec1205369d6243e5a7fb1b909e7b2c37a4eac --- /dev/null +++ b/1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_gem_xsum_article_DOC_summary_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8dd8efa69acdc495db372877c71cb2469a2211c4c90ac4f7e773987089150885 +size 9645767 diff --git a/1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_gem_xsum_article_DOC_summary_4.jsonl b/1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_gem_xsum_article_DOC_summary_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..28be6d77b9f8e638d2d7a15e36124e1370f04ae7 --- /dev/null +++ b/1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_gem_xsum_article_DOC_summary_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf99117ea1193e629d61926ba75621d399045feff9e55b087dcbd7fdbab0c566 +size 11672533 diff --git a/1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_gem_xsum_article_DOC_summary_5.jsonl b/1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_gem_xsum_article_DOC_summary_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..3fdd532ca1ec0d88f66fca9cc4bc72375795cc2e --- /dev/null +++ b/1b121b21bc4seed2/evaluation/generation/examples.1b121b21bc4seed2_gem_xsum_article_DOC_summary_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46cdf70d7a274e9271dd5c7c9475c062e124dadfc6d9c8158cb5269a878c1adc +size 13897425 diff --git a/1b121b21bc4seed2/evaluation/generation/merged.csv b/1b121b21bc4seed2/evaluation/generation/merged.csv new file mode 100644 index 0000000000000000000000000000000000000000..c43e7f3e0405a91aec70d93bf4be7e847cd7286d --- /dev/null +++ b/1b121b21bc4seed2/evaluation/generation/merged.csv @@ -0,0 +1,53 @@ +dataset,fewshots,prompt,metric,value +e2e_nlg_cleaned,0,generate_text_restaurant,rouge2_fmeasure,0.0 +e2e_nlg_cleaned,0,median,rouge2_fmeasure,0.0 +e2e_nlg_cleaned,1,generate_text_restaurant,rouge2_fmeasure,0.1270592371269382 +e2e_nlg_cleaned,1,median,rouge2_fmeasure,0.1270592371269382 +e2e_nlg_cleaned,2,generate_text_restaurant,rouge2_fmeasure,0.14523171565764664 +e2e_nlg_cleaned,2,median,rouge2_fmeasure,0.14523171565764664 +e2e_nlg_cleaned,3,generate_text_restaurant,rouge2_fmeasure,0.15040030282166134 +e2e_nlg_cleaned,3,median,rouge2_fmeasure,0.15040030282166134 +e2e_nlg_cleaned,4,generate_text_restaurant,rouge2_fmeasure,0.15099725848090637 +e2e_nlg_cleaned,4,median,rouge2_fmeasure,0.15099725848090637 +e2e_nlg_cleaned,5,generate_text_restaurant,rouge2_fmeasure,0.15368403663923805 +e2e_nlg_cleaned,5,median,rouge2_fmeasure,0.15368403663923805 +e2e_nlg_cleaned,5,average,multiple,0.12122875845439843 +gem_xsum,0,article_DOC_summary,rouge2_fmeasure,0.03695459182313156 +gem_xsum,0,median,rouge2_fmeasure,0.03695459182313156 +gem_xsum,1,article_DOC_summary,rouge2_fmeasure,0.023861206597580405 +gem_xsum,1,median,rouge2_fmeasure,0.023861206597580405 +gem_xsum,2,article_DOC_summary,rouge2_fmeasure,0.022554691732547677 +gem_xsum,2,median,rouge2_fmeasure,0.022554691732547677 +gem_xsum,3,article_DOC_summary,rouge2_fmeasure,0.019896507185675868 +gem_xsum,3,median,rouge2_fmeasure,0.019896507185675868 +gem_xsum,4,article_DOC_summary,rouge2_fmeasure,0.005239892494254664 +gem_xsum,4,median,rouge2_fmeasure,0.005239892494254664 +gem_xsum,5,article_DOC_summary,rouge2_fmeasure,0.00019304594776292888 +gem_xsum,5,median,rouge2_fmeasure,0.00019304594776292888 +gem_xsum,5,average,multiple,0.018116655963492184 +web_nlg_en,0,PALM_prompt,rouge2_fmeasure,0.044919822948790884 +web_nlg_en,0,median,rouge2_fmeasure,0.044919822948790884 +web_nlg_en,1,PALM_prompt,rouge2_fmeasure,0.04016977243576677 +web_nlg_en,1,median,rouge2_fmeasure,0.04016977243576677 +web_nlg_en,2,PALM_prompt,rouge2_fmeasure,0.041518797800848606 +web_nlg_en,2,median,rouge2_fmeasure,0.041518797800848606 +web_nlg_en,3,PALM_prompt,rouge2_fmeasure,0.041225163728007774 +web_nlg_en,3,median,rouge2_fmeasure,0.041225163728007774 +web_nlg_en,4,PALM_prompt,rouge2_fmeasure,0.04146292001846389 +web_nlg_en,4,median,rouge2_fmeasure,0.04146292001846389 +web_nlg_en,5,PALM_prompt,rouge2_fmeasure,0.04219069561770858 +web_nlg_en,5,median,rouge2_fmeasure,0.04219069561770858 +web_nlg_en,5,average,multiple,0.041914528758264416 +wiki_lingua_en,0,tldr_en,rouge2_fmeasure,0.029464599857488446 +wiki_lingua_en,0,median,rouge2_fmeasure,0.029464599857488446 +wiki_lingua_en,1,tldr_en,rouge2_fmeasure,0.028239833468568194 +wiki_lingua_en,1,median,rouge2_fmeasure,0.028239833468568194 +wiki_lingua_en,2,tldr_en,rouge2_fmeasure,0.028547689348404154 +wiki_lingua_en,2,median,rouge2_fmeasure,0.028547689348404154 +wiki_lingua_en,3,tldr_en,rouge2_fmeasure,0.025265129695390083 +wiki_lingua_en,3,median,rouge2_fmeasure,0.025265129695390083 +wiki_lingua_en,4,tldr_en,rouge2_fmeasure,0.00992332936384645 +wiki_lingua_en,4,median,rouge2_fmeasure,0.00992332936384645 +wiki_lingua_en,5,tldr_en,rouge2_fmeasure,0.0017575740188721435 +wiki_lingua_en,5,median,rouge2_fmeasure,0.0017575740188721435 +wiki_lingua_en,5,average,multiple,0.020533025958761577 diff --git a/1b121b21bc4seed2/evaluation/generation/merged.json b/1b121b21bc4seed2/evaluation/generation/merged.json new file mode 100644 index 0000000000000000000000000000000000000000..ff35fb1fbaa5c05322892fde855d2b64da3f2a5e --- /dev/null +++ b/1b121b21bc4seed2/evaluation/generation/merged.json @@ -0,0 +1 @@ +{"GEM/web_nlg_en": {"0": {"PALM_prompt": {"bleu": 0.2850756553878694, "bleu_stderr": 0.029479244787540198, "rouge1_fmeasure": 0.09250286063498843, "rouge1_fmeasure_stderr": 0.0021321582297043904, "rouge1_precision": 0.06307795392559021, "rouge1_precision_stderr": 0.0018961573476995012, "rouge1_recall": 0.2519437334576553, "rouge1_recall_stderr": 0.0046233665666279115, "rouge2_fmeasure": 0.044919822948790884, "rouge2_fmeasure_stderr": 0.0013419119538143087, "rouge2_precision": 0.031169579486007647, "rouge2_precision_stderr": 0.0013315121763508673, "rouge2_recall": 0.12406823641780289, "rouge2_recall_stderr": 0.003056908408498049, "rougeL_fmeasure": 0.08915644889918124, "rougeL_fmeasure_stderr": 0.0019635255248017934, "rougeL_precision": 0.060512962960882884, "rougeL_precision_stderr": 0.0017532071667563402, "rougeL_recall": 0.24591537295391636, "rougeL_recall_stderr": 0.004506544617650046, "rougeLsum_fmeasure": 0.0881964727255614, "rougeLsum_fmeasure_stderr": 0.00197619826433602, "rougeLsum_precision": 0.060137684271610675, "rougeLsum_precision_stderr": 0.0017836800848927256, "rougeLsum_recall": 0.24092589731633912, "rougeLsum_recall_stderr": 0.004306266650112688}}, "1": {"PALM_prompt": {"bleu": 0.24801641089701984, "bleu_stderr": 0.011989470193668068, "rouge1_fmeasure": 0.08959675554256848, "rouge1_fmeasure_stderr": 0.0018375399876627346, "rouge1_precision": 0.05818517766037036, "rouge1_precision_stderr": 0.0014819995423263183, "rouge1_recall": 0.2827362020383282, "rouge1_recall_stderr": 0.00480569342082808, "rouge2_fmeasure": 0.04016977243576677, "rouge2_fmeasure_stderr": 0.0011455508827807554, "rouge2_precision": 0.02635367956564326, "rouge2_precision_stderr": 0.0009528048262941789, "rouge2_recall": 0.12704223429697128, "rouge2_recall_stderr": 0.0030597437559013066, "rougeL_fmeasure": 0.08471881476079753, "rougeL_fmeasure_stderr": 0.0016703735129750064, "rougeL_precision": 0.05484150466192377, "rougeL_precision_stderr": 0.001315703805718461, "rougeL_recall": 0.2667301815318325, "rougeL_recall_stderr": 0.004372221951900707, "rougeLsum_fmeasure": 0.08576130624221133, "rougeLsum_fmeasure_stderr": 0.0017402119865819162, "rougeLsum_precision": 0.055740125805322414, "rougeLsum_precision_stderr": 0.0014190378903881072, "rougeLsum_recall": 0.26919922518521233, "rougeLsum_recall_stderr": 0.004429470047755656}}, "2": {"PALM_prompt": {"bleu": 0.2530185878500052, "bleu_stderr": 0.012040289243788763, "rouge1_fmeasure": 0.09138094990191768, "rouge1_fmeasure_stderr": 0.001796675120671757, "rouge1_precision": 0.058512763074349945, "rouge1_precision_stderr": 0.001317655981799918, "rouge1_recall": 0.28742836834463886, "rouge1_recall_stderr": 0.004669386290992104, "rouge2_fmeasure": 0.041518797800848606, "rouge2_fmeasure_stderr": 0.0011144817093188633, "rouge2_precision": 0.02660128395309018, "rouge2_precision_stderr": 0.0007990003962669926, "rouge2_recall": 0.13371012137028607, "rouge2_recall_stderr": 0.003130626897597201, "rougeL_fmeasure": 0.08671939835151828, "rougeL_fmeasure_stderr": 0.0016448408963673205, "rougeL_precision": 0.05542859482898103, "rougeL_precision_stderr": 0.0011932242274819006, "rougeL_recall": 0.2719360787885418, "rougeL_recall_stderr": 0.0042608863041157016, "rougeLsum_fmeasure": 0.08775702388632066, "rougeLsum_fmeasure_stderr": 0.0017074743673142906, "rougeLsum_precision": 0.056182111716967645, "rougeLsum_precision_stderr": 0.001251228891614172, "rougeLsum_recall": 0.2754066562262308, "rougeLsum_recall_stderr": 0.004372289191944523}}, "3": {"PALM_prompt": {"bleu": 0.26104356935100076, "bleu_stderr": 0.020606892130089625, "rouge1_fmeasure": 0.09225925338125805, "rouge1_fmeasure_stderr": 0.0017393497174197025, "rouge1_precision": 0.05876875730987439, "rouge1_precision_stderr": 0.001262923124165934, "rouge1_recall": 0.2978570511134094, "rouge1_recall_stderr": 0.004772108557819704, "rouge2_fmeasure": 0.041225163728007774, "rouge2_fmeasure_stderr": 0.0010870715838513074, "rouge2_precision": 0.026266986693919324, "rouge2_precision_stderr": 0.0007684696212875827, "rouge2_recall": 0.13694139873828265, "rouge2_recall_stderr": 0.0032263532566755484, "rougeL_fmeasure": 0.08719695353070112, "rougeL_fmeasure_stderr": 0.0016039844889244289, "rougeL_precision": 0.05552067895103241, "rougeL_precision_stderr": 0.0011567152896671338, "rougeL_recall": 0.27953358851668986, "rougeL_recall_stderr": 0.004336840965548908, "rougeLsum_fmeasure": 0.08861162982557379, "rougeLsum_fmeasure_stderr": 0.0016648356514252724, "rougeLsum_precision": 0.05648619086001838, "rougeLsum_precision_stderr": 0.001210169007089921, "rougeLsum_recall": 0.28427881728747934, "rougeLsum_recall_stderr": 0.004454752297972069}}, "4": {"PALM_prompt": {"bleu": 0.29578242700897045, "bleu_stderr": 0.01644855391604288, "rouge1_fmeasure": 0.09236209607564469, "rouge1_fmeasure_stderr": 0.0017155296399348975, "rouge1_precision": 0.059241759487365105, "rouge1_precision_stderr": 0.0013185605514960156, "rouge1_recall": 0.2941689602060997, "rouge1_recall_stderr": 0.004782582061622861, "rouge2_fmeasure": 0.04146292001846389, "rouge2_fmeasure_stderr": 0.0010710528467515177, "rouge2_precision": 0.026700072260856023, "rouge2_precision_stderr": 0.0008329146326999274, "rouge2_recall": 0.13703029324122062, "rouge2_recall_stderr": 0.0032032363310221562, "rougeL_fmeasure": 0.0871975029360322, "rougeL_fmeasure_stderr": 0.0015832095836349604, "rougeL_precision": 0.05584064201532722, "rougeL_precision_stderr": 0.0011822227694518028, "rougeL_recall": 0.2765136016304282, "rougeL_recall_stderr": 0.004355885247911899, "rougeLsum_fmeasure": 0.08849785197136012, "rougeLsum_fmeasure_stderr": 0.001631762057927943, "rougeLsum_precision": 0.056809260000044604, "rougeLsum_precision_stderr": 0.0012651199781666866, "rougeLsum_recall": 0.28080366233461934, "rougeLsum_recall_stderr": 0.004447560399921803}}, "5": {"PALM_prompt": {"bleu": 0.3072581712947307, "bleu_stderr": 0.013011180740751221, "rouge1_fmeasure": 0.09385006352878718, "rouge1_fmeasure_stderr": 0.0016492746708198635, "rouge1_precision": 0.05956004848850282, "rouge1_precision_stderr": 0.0011844820103012758, "rouge1_recall": 0.3050141575766028, "rouge1_recall_stderr": 0.004806860152049065, "rouge2_fmeasure": 0.04219069561770858, "rouge2_fmeasure_stderr": 0.0010275629961263655, "rouge2_precision": 0.02671744686752806, "rouge2_precision_stderr": 0.0007193199514761142, "rouge2_recall": 0.1433762159365779, "rouge2_recall_stderr": 0.003204965724880526, "rougeL_fmeasure": 0.08869899339649662, "rougeL_fmeasure_stderr": 0.0015565597321756607, "rougeL_precision": 0.056371808160412054, "rougeL_precision_stderr": 0.0011227434161722896, "rougeL_recall": 0.28550365697556257, "rougeL_recall_stderr": 0.004319358585933794, "rougeLsum_fmeasure": 0.08990792464666136, "rougeLsum_fmeasure_stderr": 0.0015790820849768395, "rougeLsum_precision": 0.057099278638911184, "rougeLsum_precision_stderr": 0.001138102224001842, "rougeLsum_recall": 0.2910079263017007, "rougeLsum_recall_stderr": 0.0044961239015304435}}}, "GEM/wiki_lingua_en": {"0": {"tldr_en": {"bleu": 1.321761515529462, "bleu_stderr": 0.06405890291232123, "rouge1_fmeasure": 0.1561377606426544, "rouge1_fmeasure_stderr": 0.0018912371468179697, "rouge1_precision": 0.13418128757490422, "rouge1_precision_stderr": 0.0019073144542996227, "rouge1_recall": 0.22370464176226834, "rouge1_recall_stderr": 0.002611499109099858, "rouge2_fmeasure": 0.029464599857488446, "rouge2_fmeasure_stderr": 0.0007789826555536276, "rouge2_precision": 0.025327472863282418, "rouge2_precision_stderr": 0.0007106910143569577, "rouge2_recall": 0.04305842511949861, "rouge2_recall_stderr": 0.0012262998119789712, "rougeL_fmeasure": 0.12424387461861276, "rougeL_fmeasure_stderr": 0.00136977188181699, "rougeL_precision": 0.10545228491836044, "rougeL_precision_stderr": 0.001352449912251029, "rougeL_recall": 0.1823578443380979, "rougeL_recall_stderr": 0.002113773481771066, "rougeLsum_fmeasure": 0.143508075517125, "rougeLsum_fmeasure_stderr": 0.0017239605017566344, "rougeLsum_precision": 0.12317282152669443, "rougeLsum_precision_stderr": 0.001738142219855923, "rougeLsum_recall": 0.20632202845312703, "rougeLsum_recall_stderr": 0.002412292367994964}}, "1": {"tldr_en": {"bleu": 1.3666198009021433, "bleu_stderr": 0.02548342731902, "rouge1_fmeasure": 0.16584774157614826, "rouge1_fmeasure_stderr": 0.00170618534117368, "rouge1_precision": 0.14320491367082974, "rouge1_precision_stderr": 0.0017845301991567476, "rouge1_recall": 0.24137867619505146, "rouge1_recall_stderr": 0.0025607829167710225, "rouge2_fmeasure": 0.028239833468568194, "rouge2_fmeasure_stderr": 0.000742179114763329, "rouge2_precision": 0.024138151973368126, "rouge2_precision_stderr": 0.0006642056284954163, "rouge2_recall": 0.04339348127802618, "rouge2_recall_stderr": 0.0013577106434495858, "rougeL_fmeasure": 0.1198532739033359, "rougeL_fmeasure_stderr": 0.001127314183736604, "rougeL_precision": 0.10239786671559123, "rougeL_precision_stderr": 0.0011893616487463725, "rougeL_recall": 0.17945313333907692, "rougeL_recall_stderr": 0.001974005906098066, "rougeLsum_fmeasure": 0.15540160642759504, "rougeLsum_fmeasure_stderr": 0.0015831136631871156, "rougeLsum_precision": 0.1340667845076243, "rougeLsum_precision_stderr": 0.001657309035299111, "rougeLsum_recall": 0.2269067249445735, "rougeLsum_recall_stderr": 0.0024213993165733594}}, "2": {"tldr_en": {"bleu": 1.330687803868559, "bleu_stderr": 0.05809493878615601, "rouge1_fmeasure": 0.16273042831855172, "rouge1_fmeasure_stderr": 0.001775802427873928, "rouge1_precision": 0.1458694998331044, "rouge1_precision_stderr": 0.0020751465219441393, "rouge1_recall": 0.23221929546910855, "rouge1_recall_stderr": 0.0024940559594616818, "rouge2_fmeasure": 0.028547689348404154, "rouge2_fmeasure_stderr": 0.0007464823189898568, "rouge2_precision": 0.026699811383133716, "rouge2_precision_stderr": 0.0009124914873931906, "rouge2_recall": 0.04136532269717438, "rouge2_recall_stderr": 0.0011921194612908434, "rougeL_fmeasure": 0.12326647530268532, "rougeL_fmeasure_stderr": 0.0012253014530928786, "rougeL_precision": 0.10982415140479714, "rougeL_precision_stderr": 0.0015215433681870106, "rougeL_recall": 0.18026503948966904, "rougeL_recall_stderr": 0.0019465654580408404, "rougeLsum_fmeasure": 0.15222819626322362, "rougeLsum_fmeasure_stderr": 0.0016446268586332612, "rougeLsum_precision": 0.13660282396539003, "rougeLsum_precision_stderr": 0.0019561376555209675, "rougeLsum_recall": 0.21773728025312808, "rougeLsum_recall_stderr": 0.0023396514300470118}}, "3": {"tldr_en": {"bleu": 1.4859120479096923, "bleu_stderr": 0.05574241192906709, "rouge1_fmeasure": 0.13727972794632332, "rouge1_fmeasure_stderr": 0.001966418255252875, "rouge1_precision": 0.1301446922879572, "rouge1_precision_stderr": 0.0023453140077651403, "rouge1_recall": 0.192560590973123, "rouge1_recall_stderr": 0.002831737470965657, "rouge2_fmeasure": 0.025265129695390083, "rouge2_fmeasure_stderr": 0.0007420512125640625, "rouge2_precision": 0.024524184294746752, "rouge2_precision_stderr": 0.0009475897993583641, "rouge2_recall": 0.036259772750247096, "rouge2_recall_stderr": 0.0012047403068686847, "rougeL_fmeasure": 0.10580900761306217, "rougeL_fmeasure_stderr": 0.001429843686104546, "rougeL_precision": 0.10008927585037762, "rougeL_precision_stderr": 0.0017992649861688023, "rougeL_recall": 0.1516749369666555, "rougeL_recall_stderr": 0.0022484203739687827, "rougeLsum_fmeasure": 0.12824788953769048, "rougeLsum_fmeasure_stderr": 0.0018235330304926663, "rougeLsum_precision": 0.12168486458438436, "rougeLsum_precision_stderr": 0.002209541457640191, "rougeLsum_recall": 0.18040752843563596, "rougeLsum_recall_stderr": 0.0026623601517320387}}, "4": {"tldr_en": {"bleu": 0.38983093510263966, "bleu_stderr": 0.020746959439040737, "rouge1_fmeasure": 0.0482938559604652, "rouge1_fmeasure_stderr": 0.0017050539428373885, "rouge1_precision": 0.04687267447236592, "rouge1_precision_stderr": 0.0018998335960580418, "rouge1_recall": 0.07098562737132999, "rouge1_recall_stderr": 0.0025626429489145814, "rouge2_fmeasure": 0.00992332936384645, "rouge2_fmeasure_stderr": 0.0005483941828877055, "rouge2_precision": 0.00945752327909291, "rouge2_precision_stderr": 0.0006557120452244116, "rouge2_recall": 0.01524147181315175, "rouge2_recall_stderr": 0.000968063791685238, "rougeL_fmeasure": 0.03777472015184596, "rougeL_fmeasure_stderr": 0.0012944979133275166, "rougeL_precision": 0.03658048025111141, "rougeL_precision_stderr": 0.0014765804478846238, "rougeL_recall": 0.056879968483736575, "rougeL_recall_stderr": 0.0020708799931085835, "rougeLsum_fmeasure": 0.04480769496337831, "rougeLsum_fmeasure_stderr": 0.0015770553891978325, "rougeLsum_precision": 0.04364094827472193, "rougeLsum_precision_stderr": 0.0017744092995215651, "rougeLsum_recall": 0.06599052444685644, "rougeLsum_recall_stderr": 0.0023914383468420387}}, "5": {"tldr_en": {"bleu": 6.848753994158733e-07, "bleu_stderr": 1.2091205071113564e-06, "rouge1_fmeasure": 0.007816345912784222, "rouge1_fmeasure_stderr": 0.0007612291694346548, "rouge1_precision": 0.007899778364305632, "rouge1_precision_stderr": 0.0008374134090368952, "rouge1_recall": 0.011343564720969444, "rouge1_recall_stderr": 0.0011277127148891929, "rouge2_fmeasure": 0.0017575740188721435, "rouge2_fmeasure_stderr": 0.00024992892095104455, "rouge2_precision": 0.0016948351052204623, "rouge2_precision_stderr": 0.00025208432207753475, "rouge2_recall": 0.002630687274039701, "rouge2_recall_stderr": 0.0004138243186705428, "rougeL_fmeasure": 0.006339645540807284, "rougeL_fmeasure_stderr": 0.0006142715904854269, "rougeL_precision": 0.006320389859749812, "rougeL_precision_stderr": 0.0006593125172728464, "rougeL_recall": 0.009415721615635371, "rougeL_recall_stderr": 0.0009461004389786301, "rougeLsum_fmeasure": 0.007195583841595385, "rougeLsum_fmeasure_stderr": 0.0006939813114362923, "rougeLsum_precision": 0.007348127779079044, "rougeLsum_precision_stderr": 0.0007820257098133964, "rougeLsum_recall": 0.01039809783113184, "rougeLsum_recall_stderr": 0.0010181220364392032}}}, "e2e_nlg_cleaned": {"0": {"generate_text_restaurant": {"bleu": 0.008438122208283742, "bleu_stderr": 0.001197050519804994, "rouge1_fmeasure": 0.010852991398846181, "rouge1_fmeasure_stderr": 0.00043603376914659093, "rouge1_precision": 0.01731813417190785, "rouge1_precision_stderr": 0.0006904015455150221, "rouge1_recall": 0.008140031462486316, "rouge1_recall_stderr": 0.0003341464417431424, "rouge2_fmeasure": 0.0, "rouge2_fmeasure_stderr": 0.0, "rouge2_precision": 0.0, "rouge2_precision_stderr": 0.0, "rouge2_recall": 0.0, "rouge2_recall_stderr": 0.0, "rougeL_fmeasure": 0.010236948851681334, "rougeL_fmeasure_stderr": 0.00040376061853106, "rougeL_precision": 0.016290356394130068, "rougeL_precision_stderr": 0.0006344252881163902, "rougeL_recall": 0.0076944580577918845, "rougeL_recall_stderr": 0.00031179286190496404, "rougeLsum_fmeasure": 0.010681172391084869, "rougeLsum_fmeasure_stderr": 0.0004270222110231445, "rougeLsum_precision": 0.017040356394130075, "rougeLsum_precision_stderr": 0.0006757816435795186, "rougeLsum_recall": 0.008014275466220572, "rougeLsum_recall_stderr": 0.0003277471469197949}}, "1": {"generate_text_restaurant": {"bleu": 5.415302314455357, "bleu_stderr": 0.08866274485975845, "rouge1_fmeasure": 0.31351772873404504, "rouge1_fmeasure_stderr": 0.0019155579544317606, "rouge1_precision": 0.27518284278158495, "rouge1_precision_stderr": 0.0026904123485453207, "rouge1_recall": 0.44395987313972773, "rouge1_recall_stderr": 0.002853052677955519, "rouge2_fmeasure": 0.1270592371269382, "rouge2_fmeasure_stderr": 0.0013298949590436037, "rouge2_precision": 0.11779839983589596, "rouge2_precision_stderr": 0.0022522445004712227, "rouge2_recall": 0.184152221066327, "rouge2_recall_stderr": 0.002022505610836659, "rougeL_fmeasure": 0.24261441305411593, "rougeL_fmeasure_stderr": 0.0013732549831421876, "rougeL_precision": 0.2142971565592026, "rougeL_precision_stderr": 0.0023228065282473727, "rougeL_recall": 0.3473102442580568, "rougeL_recall_stderr": 0.0023084199885264082, "rougeLsum_fmeasure": 0.2604729426900251, "rougeLsum_fmeasure_stderr": 0.001783692486265605, "rougeLsum_precision": 0.23044400536893825, "rougeLsum_precision_stderr": 0.0025590767181566617, "rougeLsum_recall": 0.3694044441017418, "rougeLsum_recall_stderr": 0.0026884487723429907}}, "2": {"generate_text_restaurant": {"bleu": 6.0835515625006265, "bleu_stderr": 0.13104580918021916, "rouge1_fmeasure": 0.33900310160818814, "rouge1_fmeasure_stderr": 0.001977319155178536, "rouge1_precision": 0.2974677905788029, "rouge1_precision_stderr": 0.0027133762420868996, "rouge1_recall": 0.46824453868512245, "rouge1_recall_stderr": 0.0027816673096099764, "rouge2_fmeasure": 0.14523171565764664, "rouge2_fmeasure_stderr": 0.0014456847848380934, "rouge2_precision": 0.12852946982374805, "rouge2_precision_stderr": 0.001751970024964452, "rouge2_recall": 0.2045106938957861, "rouge2_recall_stderr": 0.002085524555577239, "rougeL_fmeasure": 0.26089415735825394, "rougeL_fmeasure_stderr": 0.0015092210279407214, "rougeL_precision": 0.22768892967881724, "rougeL_precision_stderr": 0.002087880547521337, "rougeL_recall": 0.36418502101759054, "rougeL_recall_stderr": 0.002325817522071071, "rougeLsum_fmeasure": 0.2819640732417153, "rougeLsum_fmeasure_stderr": 0.0019029624581531216, "rougeLsum_precision": 0.2475565846991815, "rougeLsum_precision_stderr": 0.0024501420067594773, "rougeLsum_recall": 0.3901821108140583, "rougeLsum_recall_stderr": 0.002708125972473242}}, "3": {"generate_text_restaurant": {"bleu": 6.191081522703311, "bleu_stderr": 0.08272180666976954, "rouge1_fmeasure": 0.34451701581346555, "rouge1_fmeasure_stderr": 0.0019917632496230047, "rouge1_precision": 0.3059304522321104, "rouge1_precision_stderr": 0.0027936595692492597, "rouge1_recall": 0.4706742638622414, "rouge1_recall_stderr": 0.0027940064831602895, "rouge2_fmeasure": 0.15040030282166134, "rouge2_fmeasure_stderr": 0.0014742918695484102, "rouge2_precision": 0.13437401439677085, "rouge2_precision_stderr": 0.0017741938204701253, "rouge2_recall": 0.2092379893021306, "rouge2_recall_stderr": 0.002098339038549269, "rougeL_fmeasure": 0.26101746069946474, "rougeL_fmeasure_stderr": 0.00152874420852884, "rougeL_precision": 0.23044883331819338, "rougeL_precision_stderr": 0.0021248657249371234, "rougeL_recall": 0.360559914434991, "rougeL_recall_stderr": 0.0023451576403232576, "rougeLsum_fmeasure": 0.28608327236106273, "rougeLsum_fmeasure_stderr": 0.0018907928361422866, "rougeLsum_precision": 0.2535539353339795, "rougeLsum_precision_stderr": 0.002458411594898136, "rougeLsum_recall": 0.3921926325740904, "rougeLsum_recall_stderr": 0.002706349636318779}}, "4": {"generate_text_restaurant": {"bleu": 6.111226061397375, "bleu_stderr": 0.09062441129980986, "rouge1_fmeasure": 0.34431019911907407, "rouge1_fmeasure_stderr": 0.0019747182058236588, "rouge1_precision": 0.30328161795682607, "rouge1_precision_stderr": 0.002708454817254866, "rouge1_recall": 0.4688958080821436, "rouge1_recall_stderr": 0.002671021101118256, "rouge2_fmeasure": 0.15099725848090637, "rouge2_fmeasure_stderr": 0.0014686203885590958, "rouge2_precision": 0.13386033868102898, "rouge2_precision_stderr": 0.001714165558168862, "rouge2_recall": 0.2086704107913658, "rouge2_recall_stderr": 0.0020408838673953386, "rougeL_fmeasure": 0.2590550585031971, "rougeL_fmeasure_stderr": 0.001502995830389098, "rougeL_precision": 0.22638671811775446, "rougeL_precision_stderr": 0.0020039774183955566, "rougeL_recall": 0.35756636848528994, "rougeL_recall_stderr": 0.002297633308443435, "rougeLsum_fmeasure": 0.2853836607666494, "rougeLsum_fmeasure_stderr": 0.001891594019521224, "rougeLsum_precision": 0.2504271029683134, "rougeLsum_precision_stderr": 0.0023554702511328304, "rougeLsum_recall": 0.39039800395209395, "rougeLsum_recall_stderr": 0.002657711797112865}}, "5": {"generate_text_restaurant": {"bleu": 6.157356980483942, "bleu_stderr": 0.07864334022914665, "rouge1_fmeasure": 0.35051512109030886, "rouge1_fmeasure_stderr": 0.0019782779391466078, "rouge1_precision": 0.30466283281999534, "rouge1_precision_stderr": 0.0025978328638333616, "rouge1_recall": 0.4773039407134765, "rouge1_recall_stderr": 0.002664398147764323, "rouge2_fmeasure": 0.15368403663923805, "rouge2_fmeasure_stderr": 0.0014239556304565032, "rouge2_precision": 0.13400973384465575, "rouge2_precision_stderr": 0.0016288510201777058, "rouge2_recall": 0.21289488423428288, "rouge2_recall_stderr": 0.002000085706195211, "rougeL_fmeasure": 0.25918799434536877, "rougeL_fmeasure_stderr": 0.0015032561739134625, "rougeL_precision": 0.22385070378222516, "rougeL_precision_stderr": 0.0019273938628042813, "rougeL_recall": 0.3574082439802802, "rougeL_recall_stderr": 0.002275515159936868, "rougeLsum_fmeasure": 0.2922680755704595, "rougeLsum_fmeasure_stderr": 0.0018749054110706917, "rougeLsum_precision": 0.2535442923717527, "rougeLsum_precision_stderr": 0.0022917134606788734, "rougeLsum_recall": 0.39929532049271077, "rougeLsum_recall_stderr": 0.002600651131060951}}}, "gem_xsum": {"0": {"article_DOC_summary": {"bleu": 1.3129317790470016, "bleu_stderr": 0.07760065268118045, "rouge1_fmeasure": 0.18901821549901887, "rouge1_fmeasure_stderr": 0.002279829129106952, "rouge1_precision": 0.13501905286560467, "rouge1_precision_stderr": 0.0017190548809381608, "rouge1_recall": 0.3283241072423947, "rouge1_recall_stderr": 0.0038525710180174508, "rouge2_fmeasure": 0.03695459182313156, "rouge2_fmeasure_stderr": 0.0012557792366904089, "rouge2_precision": 0.02615731107536162, "rouge2_precision_stderr": 0.0008966873086018211, "rouge2_recall": 0.06575913031162332, "rouge2_recall_stderr": 0.002266591287149122, "rougeL_fmeasure": 0.14412588822347172, "rougeL_fmeasure_stderr": 0.0016582568651692159, "rougeL_precision": 0.1027427586819049, "rougeL_precision_stderr": 0.001244941572662973, "rougeL_recall": 0.252046388299858, "rougeL_recall_stderr": 0.002947806442204036, "rougeLsum_fmeasure": 0.14899415385858006, "rougeLsum_fmeasure_stderr": 0.0019181750290880519, "rougeLsum_precision": 0.10624155578857983, "rougeLsum_precision_stderr": 0.001424582628324823, "rougeLsum_recall": 0.26000319990620885, "rougeLsum_recall_stderr": 0.0033470003654420873}}, "1": {"article_DOC_summary": {"bleu": 0.9224414632472534, "bleu_stderr": 0.08019869073111606, "rouge1_fmeasure": 0.15187372372759875, "rouge1_fmeasure_stderr": 0.002238363045234264, "rouge1_precision": 0.10785786524836369, "rouge1_precision_stderr": 0.00166393179985334, "rouge1_recall": 0.26764764317740486, "rouge1_recall_stderr": 0.003811737165493939, "rouge2_fmeasure": 0.023861206597580405, "rouge2_fmeasure_stderr": 0.0011166771493325116, "rouge2_precision": 0.016853649910436037, "rouge2_precision_stderr": 0.0007934380254041366, "rouge2_recall": 0.04266671919641135, "rouge2_recall_stderr": 0.0020332253461267506, "rougeL_fmeasure": 0.12003447267920726, "rougeL_fmeasure_stderr": 0.0016620315126572962, "rougeL_precision": 0.0850737564631199, "rougeL_precision_stderr": 0.001231208254663744, "rougeL_recall": 0.21291139183497299, "rougeL_recall_stderr": 0.0029192691827101673, "rougeLsum_fmeasure": 0.12165528120740891, "rougeLsum_fmeasure_stderr": 0.001786850495717495, "rougeLsum_precision": 0.08614064999564035, "rougeLsum_precision_stderr": 0.0013137573398773557, "rougeLsum_recall": 0.21627422684982414, "rougeLsum_recall_stderr": 0.0031741815045650216}}, "2": {"article_DOC_summary": {"bleu": 0.7849705282265558, "bleu_stderr": 0.05021581187998352, "rouge1_fmeasure": 0.14992707811107275, "rouge1_fmeasure_stderr": 0.0021846261144537115, "rouge1_precision": 0.1062226714370173, "rouge1_precision_stderr": 0.0016313647653793566, "rouge1_recall": 0.2649518628728813, "rouge1_recall_stderr": 0.003652381902131823, "rouge2_fmeasure": 0.022554691732547677, "rouge2_fmeasure_stderr": 0.0010629952996922107, "rouge2_precision": 0.01588044344088591, "rouge2_precision_stderr": 0.0007537881734122496, "rouge2_recall": 0.04053986486635946, "rouge2_recall_stderr": 0.0019391443831652793, "rougeL_fmeasure": 0.11929556728475006, "rougeL_fmeasure_stderr": 0.0016092633921978442, "rougeL_precision": 0.08432740681651495, "rougeL_precision_stderr": 0.0011919454883656977, "rougeL_recall": 0.21219568397714195, "rougeL_recall_stderr": 0.00280778428980714, "rougeLsum_fmeasure": 0.11841507440799803, "rougeLsum_fmeasure_stderr": 0.0017311352559642463, "rougeLsum_precision": 0.08362060554920302, "rougeLsum_precision_stderr": 0.0012757122592231506, "rougeLsum_recall": 0.21114568653248753, "rougeLsum_recall_stderr": 0.003020669313336447}}, "3": {"article_DOC_summary": {"bleu": 0.7190258437509995, "bleu_stderr": 0.042187577531458346, "rouge1_fmeasure": 0.13810451001882001, "rouge1_fmeasure_stderr": 0.0022714225587039667, "rouge1_precision": 0.10057846011875604, "rouge1_precision_stderr": 0.0018497294107205577, "rouge1_recall": 0.23942926779906215, "rouge1_recall_stderr": 0.003842497556321712, "rouge2_fmeasure": 0.019896507185675868, "rouge2_fmeasure_stderr": 0.0010117990051707437, "rouge2_precision": 0.014408897494360922, "rouge2_precision_stderr": 0.0007527082518367464, "rouge2_recall": 0.035145702586454476, "rouge2_recall_stderr": 0.0018205243537310583, "rougeL_fmeasure": 0.11124617587091595, "rougeL_fmeasure_stderr": 0.0017443372993626053, "rougeL_precision": 0.08102526691338699, "rougeL_precision_stderr": 0.0014626039759259395, "rougeL_recall": 0.19354330349683008, "rougeL_recall_stderr": 0.0029953557840955284, "rougeLsum_fmeasure": 0.11048932831500144, "rougeLsum_fmeasure_stderr": 0.0018170680342048896, "rougeLsum_precision": 0.0803671735666726, "rougeLsum_precision_stderr": 0.0015024060943462886, "rougeLsum_recall": 0.1928976711119303, "rougeLsum_recall_stderr": 0.003150396864481297}}, "4": {"article_DOC_summary": {"bleu": 0.32351273593768703, "bleu_stderr": 0.08540381984004876, "rouge1_fmeasure": 0.03779629267333967, "rouge1_fmeasure_stderr": 0.002174444567033052, "rouge1_precision": 0.03173204900268027, "rouge1_precision_stderr": 0.002027826208658339, "rouge1_recall": 0.05989088557122078, "rouge1_recall_stderr": 0.0034559892001691417, "rouge2_fmeasure": 0.005239892494254664, "rouge2_fmeasure_stderr": 0.0005866501971322619, "rouge2_precision": 0.004425484224867963, "rouge2_precision_stderr": 0.000643504684134592, "rouge2_recall": 0.008676763065921654, "rouge2_recall_stderr": 0.0009869539677775623, "rougeL_fmeasure": 0.030163301894705917, "rougeL_fmeasure_stderr": 0.0017082556309796733, "rougeL_precision": 0.025562577011753043, "rougeL_precision_stderr": 0.0016557292706477333, "rougeL_recall": 0.04810137820818986, "rougeL_recall_stderr": 0.002762103216085477, "rougeLsum_fmeasure": 0.030777834462545225, "rougeLsum_fmeasure_stderr": 0.0017676759430837576, "rougeLsum_precision": 0.026108776067360468, "rougeLsum_precision_stderr": 0.0017169750619199886, "rougeLsum_recall": 0.04912097715557878, "rougeLsum_recall_stderr": 0.002853073868806013}}, "5": {"article_DOC_summary": {"bleu": 1.0347712018500012e-39, "bleu_stderr": 1.5407113142608347e-34, "rouge1_fmeasure": 0.002313684367811786, "rouge1_fmeasure_stderr": 0.0006507326736497126, "rouge1_precision": 0.0028066473138469166, "rouge1_precision_stderr": 0.0008207012823296872, "rouge1_recall": 0.0020864639544280125, "rouge1_recall_stderr": 0.0005806543667432164, "rouge2_fmeasure": 0.00019304594776292888, "rouge2_fmeasure_stderr": 9.705711124778186e-05, "rouge2_precision": 0.00023749835070589783, "rouge2_precision_stderr": 0.0001188407936767355, "rouge2_recall": 0.0001673483748955447, "rouge2_recall_stderr": 8.57618183045581e-05, "rougeL_fmeasure": 0.001631869743854381, "rougeL_fmeasure_stderr": 0.00043610635442712287, "rougeL_precision": 0.0019047789901811747, "rougeL_precision_stderr": 0.0005159501799768975, "rougeL_recall": 0.0015276752695243573, "rougeL_recall_stderr": 0.0004218946829627963, "rougeLsum_fmeasure": 0.0018840090143813742, "rougeLsum_fmeasure_stderr": 0.0005098533594631085, "rougeLsum_precision": 0.002236816201562974, "rougeLsum_precision_stderr": 0.0006238629929594013, "rougeLsum_recall": 0.0017355764056056515, "rougeLsum_recall_stderr": 0.0004749539743411232}}}} \ No newline at end of file diff --git a/1b121b21bc4seed2/evaluation/generation/slim.1b121b21bc4seed2_GEM-web_nlg_en_PALM_prompt_0.json b/1b121b21bc4seed2/evaluation/generation/slim.1b121b21bc4seed2_GEM-web_nlg_en_PALM_prompt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..d479ee4656a4de4a921c76f943f9a56dcfc5eb54 --- /dev/null +++ b/1b121b21bc4seed2/evaluation/generation/slim.1b121b21bc4seed2_GEM-web_nlg_en_PALM_prompt_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.2850756553878694, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.029479244787540198 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.06307795392559021, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0018961573476995012 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.2519437334576553, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0046233665666279115 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.09250286063498843, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0021321582297043904 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.031169579486007647, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0013315121763508673 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.12406823641780289, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003056908408498049 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.044919822948790884, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0013419119538143087 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.060512962960882884, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0017532071667563402 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.24591537295391636, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004506544617650046 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.08915644889918124, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0019635255248017934 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.060137684271610675, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0017836800848927256 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.24092589731633912, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004306266650112688 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.0881964727255614, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.00197619826433602 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed2/evaluation/generation/slim.1b121b21bc4seed2_GEM-web_nlg_en_PALM_prompt_1.json b/1b121b21bc4seed2/evaluation/generation/slim.1b121b21bc4seed2_GEM-web_nlg_en_PALM_prompt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..ed61e59c5fb13372c918b04d01620100d48854ce --- /dev/null +++ b/1b121b21bc4seed2/evaluation/generation/slim.1b121b21bc4seed2_GEM-web_nlg_en_PALM_prompt_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.24801641089701984, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.011989470193668068 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.05818517766037036, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0014819995423263183 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.2827362020383282, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.00480569342082808 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.08959675554256848, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0018375399876627346 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.02635367956564326, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0009528048262941789 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.12704223429697128, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0030597437559013066 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.04016977243576677, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0011455508827807554 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.05484150466192377, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.001315703805718461 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.2667301815318325, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004372221951900707 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.08471881476079753, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0016703735129750064 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.055740125805322414, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0014190378903881072 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.26919922518521233, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004429470047755656 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.08576130624221133, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0017402119865819162 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed2/evaluation/generation/slim.1b121b21bc4seed2_GEM-web_nlg_en_PALM_prompt_2.json b/1b121b21bc4seed2/evaluation/generation/slim.1b121b21bc4seed2_GEM-web_nlg_en_PALM_prompt_2.json new file mode 100644 index 0000000000000000000000000000000000000000..b2fce53f916f5e098deb93d49c904e61ebd05d58 --- /dev/null +++ b/1b121b21bc4seed2/evaluation/generation/slim.1b121b21bc4seed2_GEM-web_nlg_en_PALM_prompt_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.2530185878500052, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.012040289243788763 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.058512763074349945, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.001317655981799918 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.28742836834463886, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.004669386290992104 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.09138094990191768, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.001796675120671757 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.02660128395309018, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007990003962669926 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.13371012137028607, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003130626897597201 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.041518797800848606, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0011144817093188633 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.05542859482898103, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0011932242274819006 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.2719360787885418, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0042608863041157016 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.08671939835151828, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0016448408963673205 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.056182111716967645, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.001251228891614172 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.2754066562262308, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004372289191944523 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.08775702388632066, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0017074743673142906 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed2/evaluation/generation/slim.1b121b21bc4seed2_GEM-web_nlg_en_PALM_prompt_3.json b/1b121b21bc4seed2/evaluation/generation/slim.1b121b21bc4seed2_GEM-web_nlg_en_PALM_prompt_3.json new file mode 100644 index 0000000000000000000000000000000000000000..2ad832ad6497895cb24051b32c4195ebfb65c2c6 --- /dev/null +++ b/1b121b21bc4seed2/evaluation/generation/slim.1b121b21bc4seed2_GEM-web_nlg_en_PALM_prompt_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.26104356935100076, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.020606892130089625 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.05876875730987439, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.001262923124165934 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.2978570511134094, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.004772108557819704 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.09225925338125805, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0017393497174197025 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.026266986693919324, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007684696212875827 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.13694139873828265, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0032263532566755484 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.041225163728007774, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0010870715838513074 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.05552067895103241, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0011567152896671338 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.27953358851668986, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004336840965548908 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.08719695353070112, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0016039844889244289 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.05648619086001838, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.001210169007089921 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.28427881728747934, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004454752297972069 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.08861162982557379, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0016648356514252724 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed2/evaluation/generation/slim.1b121b21bc4seed2_GEM-web_nlg_en_PALM_prompt_4.json b/1b121b21bc4seed2/evaluation/generation/slim.1b121b21bc4seed2_GEM-web_nlg_en_PALM_prompt_4.json new file mode 100644 index 0000000000000000000000000000000000000000..da3c33df21bef5c418e67d699ecb99154982399b --- /dev/null +++ b/1b121b21bc4seed2/evaluation/generation/slim.1b121b21bc4seed2_GEM-web_nlg_en_PALM_prompt_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.29578242700897045, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.01644855391604288 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.059241759487365105, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0013185605514960156 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.2941689602060997, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.004782582061622861 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.09236209607564469, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0017155296399348975 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.026700072260856023, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0008329146326999274 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.13703029324122062, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0032032363310221562 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.04146292001846389, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0010710528467515177 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.05584064201532722, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0011822227694518028 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.2765136016304282, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004355885247911899 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.0871975029360322, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0015832095836349604 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.056809260000044604, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0012651199781666866 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.28080366233461934, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004447560399921803 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.08849785197136012, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.001631762057927943 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed2/evaluation/generation/slim.1b121b21bc4seed2_GEM-web_nlg_en_PALM_prompt_5.json b/1b121b21bc4seed2/evaluation/generation/slim.1b121b21bc4seed2_GEM-web_nlg_en_PALM_prompt_5.json new file mode 100644 index 0000000000000000000000000000000000000000..9eeb4deebe9c7bc4ebc67859eedcd968e3240c77 --- /dev/null +++ b/1b121b21bc4seed2/evaluation/generation/slim.1b121b21bc4seed2_GEM-web_nlg_en_PALM_prompt_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.3072581712947307, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.013011180740751221 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.05956004848850282, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0011844820103012758 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.3050141575766028, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.004806860152049065 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.09385006352878718, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0016492746708198635 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.02671744686752806, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007193199514761142 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.1433762159365779, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003204965724880526 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.04219069561770858, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0010275629961263655 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.056371808160412054, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0011227434161722896 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.28550365697556257, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004319358585933794 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.08869899339649662, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0015565597321756607 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.057099278638911184, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.001138102224001842 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.2910079263017007, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0044961239015304435 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.08990792464666136, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0015790820849768395 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed2/evaluation/generation/slim.1b121b21bc4seed2_GEM-wiki_lingua_en_tldr_en_0.json b/1b121b21bc4seed2/evaluation/generation/slim.1b121b21bc4seed2_GEM-wiki_lingua_en_tldr_en_0.json new file mode 100644 index 0000000000000000000000000000000000000000..4999c5431ff78218386837ffc1c92b083e07029b --- /dev/null +++ b/1b121b21bc4seed2/evaluation/generation/slim.1b121b21bc4seed2_GEM-wiki_lingua_en_tldr_en_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.13418128757490422, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0019073144542996227 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.22370464176226834, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.002611499109099858 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.1561377606426544, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0018912371468179697 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.025327472863282418, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007106910143569577 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.04305842511949861, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0012262998119789712 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.029464599857488446, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0007789826555536276 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.10545228491836044, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.001352449912251029 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.1823578443380979, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.002113773481771066 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.12424387461861276, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.00136977188181699 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.12317282152669443, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.001738142219855923 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.20632202845312703, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.002412292367994964 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.143508075517125, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0017239605017566344 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 1.321761515529462, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.06405890291232123 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed2/evaluation/generation/slim.1b121b21bc4seed2_GEM-wiki_lingua_en_tldr_en_1.json b/1b121b21bc4seed2/evaluation/generation/slim.1b121b21bc4seed2_GEM-wiki_lingua_en_tldr_en_1.json new file mode 100644 index 0000000000000000000000000000000000000000..cd69d9f7c969f6590f40f8c80daae7d39600ef8b --- /dev/null +++ b/1b121b21bc4seed2/evaluation/generation/slim.1b121b21bc4seed2_GEM-wiki_lingua_en_tldr_en_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.14320491367082974, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0017845301991567476 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.24137867619505146, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0025607829167710225 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.16584774157614826, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.00170618534117368 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.024138151973368126, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0006642056284954163 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.04339348127802618, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0013577106434495858 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.028239833468568194, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.000742179114763329 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.10239786671559123, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0011893616487463725 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.17945313333907692, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.001974005906098066 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.1198532739033359, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.001127314183736604 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.1340667845076243, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.001657309035299111 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.2269067249445735, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0024213993165733594 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.15540160642759504, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0015831136631871156 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 1.3666198009021433, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.02548342731902 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed2/evaluation/generation/slim.1b121b21bc4seed2_GEM-wiki_lingua_en_tldr_en_2.json b/1b121b21bc4seed2/evaluation/generation/slim.1b121b21bc4seed2_GEM-wiki_lingua_en_tldr_en_2.json new file mode 100644 index 0000000000000000000000000000000000000000..4be20f2e82da51d6b28184747cff3c409ad568b1 --- /dev/null +++ b/1b121b21bc4seed2/evaluation/generation/slim.1b121b21bc4seed2_GEM-wiki_lingua_en_tldr_en_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.1458694998331044, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0020751465219441393 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.23221929546910855, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0024940559594616818 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.16273042831855172, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.001775802427873928 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.026699811383133716, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0009124914873931906 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.04136532269717438, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0011921194612908434 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.028547689348404154, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0007464823189898568 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.10982415140479714, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0015215433681870106 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.18026503948966904, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0019465654580408404 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.12326647530268532, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0012253014530928786 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.13660282396539003, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0019561376555209675 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.21773728025312808, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0023396514300470118 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.15222819626322362, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0016446268586332612 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 1.330687803868559, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.05809493878615601 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed2/evaluation/generation/slim.1b121b21bc4seed2_GEM-wiki_lingua_en_tldr_en_3.json b/1b121b21bc4seed2/evaluation/generation/slim.1b121b21bc4seed2_GEM-wiki_lingua_en_tldr_en_3.json new file mode 100644 index 0000000000000000000000000000000000000000..79c17b0381b4cf91bd49c7441b25a43cf7d4d057 --- /dev/null +++ b/1b121b21bc4seed2/evaluation/generation/slim.1b121b21bc4seed2_GEM-wiki_lingua_en_tldr_en_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.1301446922879572, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0023453140077651403 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.192560590973123, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.002831737470965657 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.13727972794632332, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.001966418255252875 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.024524184294746752, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0009475897993583641 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.036259772750247096, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0012047403068686847 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.025265129695390083, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0007420512125640625 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.10008927585037762, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0017992649861688023 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.1516749369666555, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0022484203739687827 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.10580900761306217, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.001429843686104546 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.12168486458438436, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.002209541457640191 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.18040752843563596, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0026623601517320387 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.12824788953769048, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0018235330304926663 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 1.4859120479096923, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.05574241192906709 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed2/evaluation/generation/slim.1b121b21bc4seed2_GEM-wiki_lingua_en_tldr_en_4.json b/1b121b21bc4seed2/evaluation/generation/slim.1b121b21bc4seed2_GEM-wiki_lingua_en_tldr_en_4.json new file mode 100644 index 0000000000000000000000000000000000000000..2a0f4c14c2069cff3d0c9d4da4d77966c3778ec7 --- /dev/null +++ b/1b121b21bc4seed2/evaluation/generation/slim.1b121b21bc4seed2_GEM-wiki_lingua_en_tldr_en_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.04687267447236592, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0018998335960580418 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.07098562737132999, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0025626429489145814 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.0482938559604652, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0017050539428373885 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.00945752327909291, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0006557120452244116 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.01524147181315175, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.000968063791685238 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.00992332936384645, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0005483941828877055 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.03658048025111141, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0014765804478846238 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.056879968483736575, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0020708799931085835 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.03777472015184596, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0012944979133275166 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.04364094827472193, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0017744092995215651 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.06599052444685644, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0023914383468420387 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.04480769496337831, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0015770553891978325 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 0.38983093510263966, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.020746959439040737 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed2/evaluation/generation/slim.1b121b21bc4seed2_GEM-wiki_lingua_en_tldr_en_5.json b/1b121b21bc4seed2/evaluation/generation/slim.1b121b21bc4seed2_GEM-wiki_lingua_en_tldr_en_5.json new file mode 100644 index 0000000000000000000000000000000000000000..cb56ba99fbcffefa4b7c46f6d8e52f6409de72a4 --- /dev/null +++ b/1b121b21bc4seed2/evaluation/generation/slim.1b121b21bc4seed2_GEM-wiki_lingua_en_tldr_en_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.007899778364305632, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0008374134090368952 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.011343564720969444, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0011277127148891929 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.007816345912784222, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0007612291694346548 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.0016948351052204623, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.00025208432207753475 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.002630687274039701, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0004138243186705428 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.0017575740188721435, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.00024992892095104455 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.006320389859749812, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0006593125172728464 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.009415721615635371, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0009461004389786301 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.006339645540807284, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0006142715904854269 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.007348127779079044, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0007820257098133964 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.01039809783113184, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0010181220364392032 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.007195583841595385, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0006939813114362923 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 6.848753994158733e-07, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 1.2091205071113564e-06 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed2/evaluation/generation/slim.1b121b21bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_0.json b/1b121b21bc4seed2/evaluation/generation/slim.1b121b21bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..aedc915d551255513e6311ef336375b16603385e --- /dev/null +++ b/1b121b21bc4seed2/evaluation/generation/slim.1b121b21bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 0.008438122208283742, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.001197050519804994 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.01731813417190785, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0006904015455150221 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.008140031462486316, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0003341464417431424 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.010852991398846181, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.00043603376914659093 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.0, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.0, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.0, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.016290356394130068, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0006344252881163902 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.0076944580577918845, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.00031179286190496404 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.010236948851681334, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.00040376061853106 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.017040356394130075, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0006757816435795186 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.008014275466220572, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0003277471469197949 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.010681172391084869, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0004270222110231445 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed2/evaluation/generation/slim.1b121b21bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_1.json b/1b121b21bc4seed2/evaluation/generation/slim.1b121b21bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_1.json new file mode 100644 index 0000000000000000000000000000000000000000..9fa5437067b9547a1f03bacb7ec4cc8b2a397afa --- /dev/null +++ b/1b121b21bc4seed2/evaluation/generation/slim.1b121b21bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 5.415302314455357, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.08866274485975845 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.27518284278158495, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0026904123485453207 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.44395987313972773, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.002853052677955519 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.31351772873404504, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0019155579544317606 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.11779839983589596, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0022522445004712227 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.184152221066327, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.002022505610836659 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.1270592371269382, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0013298949590436037 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.2142971565592026, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0023228065282473727 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3473102442580568, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0023084199885264082 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.24261441305411593, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0013732549831421876 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.23044400536893825, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0025590767181566617 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3694044441017418, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0026884487723429907 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.2604729426900251, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.001783692486265605 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed2/evaluation/generation/slim.1b121b21bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_2.json b/1b121b21bc4seed2/evaluation/generation/slim.1b121b21bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_2.json new file mode 100644 index 0000000000000000000000000000000000000000..0a3b879fb86f5b130da140c15e03267dc60d1488 --- /dev/null +++ b/1b121b21bc4seed2/evaluation/generation/slim.1b121b21bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 6.0835515625006265, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.13104580918021916 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.2974677905788029, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0027133762420868996 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.46824453868512245, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0027816673096099764 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.33900310160818814, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.001977319155178536 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.12852946982374805, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.001751970024964452 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.2045106938957861, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.002085524555577239 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.14523171565764664, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0014456847848380934 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.22768892967881724, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.002087880547521337 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.36418502101759054, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.002325817522071071 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.26089415735825394, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0015092210279407214 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.2475565846991815, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0024501420067594773 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3901821108140583, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002708125972473242 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.2819640732417153, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0019029624581531216 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed2/evaluation/generation/slim.1b121b21bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_3.json b/1b121b21bc4seed2/evaluation/generation/slim.1b121b21bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_3.json new file mode 100644 index 0000000000000000000000000000000000000000..e8c64c29a2ee74a24dff34383a9cde07a2674cce --- /dev/null +++ b/1b121b21bc4seed2/evaluation/generation/slim.1b121b21bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 6.191081522703311, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.08272180666976954 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.3059304522321104, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0027936595692492597 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4706742638622414, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0027940064831602895 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.34451701581346555, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0019917632496230047 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.13437401439677085, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0017741938204701253 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.2092379893021306, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.002098339038549269 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.15040030282166134, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0014742918695484102 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.23044883331819338, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0021248657249371234 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.360559914434991, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0023451576403232576 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.26101746069946474, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.00152874420852884 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.2535539353339795, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.002458411594898136 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3921926325740904, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002706349636318779 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.28608327236106273, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0018907928361422866 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed2/evaluation/generation/slim.1b121b21bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_4.json b/1b121b21bc4seed2/evaluation/generation/slim.1b121b21bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_4.json new file mode 100644 index 0000000000000000000000000000000000000000..bbb64b6db092b3b99e062f2c4603c437b81a08d1 --- /dev/null +++ b/1b121b21bc4seed2/evaluation/generation/slim.1b121b21bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 6.111226061397375, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.09062441129980986 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.30328161795682607, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.002708454817254866 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4688958080821436, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.002671021101118256 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.34431019911907407, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0019747182058236588 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.13386033868102898, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.001714165558168862 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.2086704107913658, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0020408838673953386 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.15099725848090637, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0014686203885590958 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.22638671811775446, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0020039774183955566 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.35756636848528994, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.002297633308443435 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.2590550585031971, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.001502995830389098 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.2504271029683134, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0023554702511328304 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.39039800395209395, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002657711797112865 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.2853836607666494, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.001891594019521224 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed2/evaluation/generation/slim.1b121b21bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_5.json b/1b121b21bc4seed2/evaluation/generation/slim.1b121b21bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_5.json new file mode 100644 index 0000000000000000000000000000000000000000..81828fe3c94ae23c9c19e244f18195a665180cdd --- /dev/null +++ b/1b121b21bc4seed2/evaluation/generation/slim.1b121b21bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 6.157356980483942, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.07864334022914665 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.30466283281999534, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0025978328638333616 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4773039407134765, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.002664398147764323 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.35051512109030886, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0019782779391466078 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.13400973384465575, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0016288510201777058 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.21289488423428288, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.002000085706195211 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.15368403663923805, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0014239556304565032 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.22385070378222516, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0019273938628042813 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3574082439802802, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.002275515159936868 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.25918799434536877, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0015032561739134625 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.2535442923717527, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0022917134606788734 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.39929532049271077, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002600651131060951 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.2922680755704595, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0018749054110706917 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed2/evaluation/generation/slim.1b121b21bc4seed2_gem_xsum_article_DOC_summary_0.json b/1b121b21bc4seed2/evaluation/generation/slim.1b121b21bc4seed2_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..d8bfefc6f8d6c24e56b3819b5dc01afdc47163da --- /dev/null +++ b/1b121b21bc4seed2/evaluation/generation/slim.1b121b21bc4seed2_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.13501905286560467, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0017190548809381608 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.3283241072423947, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.0038525710180174508 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.18901821549901887, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.002279829129106952 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.02615731107536162, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0008966873086018211 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.06575913031162332, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.002266591287149122 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.03695459182313156, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0012557792366904089 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.1027427586819049, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.001244941572662973 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.252046388299858, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.002947806442204036 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.14412588822347172, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0016582568651692159 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.10624155578857983, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.001424582628324823 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.26000319990620885, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0033470003654420873 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.14899415385858006, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0019181750290880519 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.3129317790470016, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.07760065268118045 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed2/evaluation/generation/slim.1b121b21bc4seed2_gem_xsum_article_DOC_summary_1.json b/1b121b21bc4seed2/evaluation/generation/slim.1b121b21bc4seed2_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..27b33e07b0eaac5afff69b6bbe7c8d9e7eb3c6f8 --- /dev/null +++ b/1b121b21bc4seed2/evaluation/generation/slim.1b121b21bc4seed2_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.10785786524836369, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.00166393179985334 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.26764764317740486, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.003811737165493939 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.15187372372759875, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.002238363045234264 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.016853649910436037, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0007934380254041366 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.04266671919641135, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0020332253461267506 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.023861206597580405, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0011166771493325116 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.0850737564631199, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.001231208254663744 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.21291139183497299, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0029192691827101673 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.12003447267920726, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0016620315126572962 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.08614064999564035, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0013137573398773557 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.21627422684982414, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0031741815045650216 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.12165528120740891, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.001786850495717495 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 0.9224414632472534, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.08019869073111606 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed2/evaluation/generation/slim.1b121b21bc4seed2_gem_xsum_article_DOC_summary_2.json b/1b121b21bc4seed2/evaluation/generation/slim.1b121b21bc4seed2_gem_xsum_article_DOC_summary_2.json new file mode 100644 index 0000000000000000000000000000000000000000..cddd7015630ab30d5fbd626be4584fa78ac95d90 --- /dev/null +++ b/1b121b21bc4seed2/evaluation/generation/slim.1b121b21bc4seed2_gem_xsum_article_DOC_summary_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.1062226714370173, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0016313647653793566 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.2649518628728813, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.003652381902131823 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.14992707811107275, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0021846261144537115 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.01588044344088591, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0007537881734122496 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.04053986486635946, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0019391443831652793 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.022554691732547677, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0010629952996922107 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.08432740681651495, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0011919454883656977 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.21219568397714195, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.00280778428980714 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.11929556728475006, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0016092633921978442 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.08362060554920302, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0012757122592231506 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.21114568653248753, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.003020669313336447 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.11841507440799803, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0017311352559642463 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 0.7849705282265558, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.05021581187998352 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed2/evaluation/generation/slim.1b121b21bc4seed2_gem_xsum_article_DOC_summary_3.json b/1b121b21bc4seed2/evaluation/generation/slim.1b121b21bc4seed2_gem_xsum_article_DOC_summary_3.json new file mode 100644 index 0000000000000000000000000000000000000000..c8346ea3cb5201f61292d679af6315cb84cd1641 --- /dev/null +++ b/1b121b21bc4seed2/evaluation/generation/slim.1b121b21bc4seed2_gem_xsum_article_DOC_summary_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.10057846011875604, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0018497294107205577 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.23942926779906215, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.003842497556321712 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.13810451001882001, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0022714225587039667 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.014408897494360922, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0007527082518367464 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.035145702586454476, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0018205243537310583 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.019896507185675868, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0010117990051707437 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.08102526691338699, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0014626039759259395 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.19354330349683008, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0029953557840955284 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.11124617587091595, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0017443372993626053 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.0803671735666726, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0015024060943462886 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.1928976711119303, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.003150396864481297 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.11048932831500144, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0018170680342048896 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 0.7190258437509995, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.042187577531458346 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed2/evaluation/generation/slim.1b121b21bc4seed2_gem_xsum_article_DOC_summary_4.json b/1b121b21bc4seed2/evaluation/generation/slim.1b121b21bc4seed2_gem_xsum_article_DOC_summary_4.json new file mode 100644 index 0000000000000000000000000000000000000000..1535e336a63f620f7733a9ad43df072382abf88b --- /dev/null +++ b/1b121b21bc4seed2/evaluation/generation/slim.1b121b21bc4seed2_gem_xsum_article_DOC_summary_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.03173204900268027, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.002027826208658339 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.05989088557122078, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.0034559892001691417 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.03779629267333967, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.002174444567033052 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.004425484224867963, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.000643504684134592 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.008676763065921654, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0009869539677775623 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.005239892494254664, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0005866501971322619 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.025562577011753043, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0016557292706477333 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.04810137820818986, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.002762103216085477 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.030163301894705917, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0017082556309796733 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.026108776067360468, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0017169750619199886 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.04912097715557878, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.002853073868806013 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.030777834462545225, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0017676759430837576 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 0.32351273593768703, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.08540381984004876 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed2/evaluation/generation/slim.1b121b21bc4seed2_gem_xsum_article_DOC_summary_5.json b/1b121b21bc4seed2/evaluation/generation/slim.1b121b21bc4seed2_gem_xsum_article_DOC_summary_5.json new file mode 100644 index 0000000000000000000000000000000000000000..52589f1b2fea12fd11ba4b3fff9aad9861c9b1bf --- /dev/null +++ b/1b121b21bc4seed2/evaluation/generation/slim.1b121b21bc4seed2_gem_xsum_article_DOC_summary_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.0028066473138469166, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0008207012823296872 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.0020864639544280125, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.0005806543667432164 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.002313684367811786, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0006507326736497126 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.00023749835070589783, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0001188407936767355 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.0001673483748955447, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 8.57618183045581e-05 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.00019304594776292888, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 9.705711124778186e-05 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.0019047789901811747, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0005159501799768975 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.0015276752695243573, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0004218946829627963 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.001631869743854381, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.00043610635442712287 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.002236816201562974, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0006238629929594013 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.0017355764056056515, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0004749539743411232 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.0018840090143813742, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0005098533594631085 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.0347712018500012e-39, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 1.5407113142608347e-34 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed2/evaluation/rankeval/1b121b21bc4seed2_0.csv b/1b121b21bc4seed2/evaluation/rankeval/1b121b21bc4seed2_0.csv new file mode 100644 index 0000000000000000000000000000000000000000..fab69326320c8dbc588e7ce92eafbb14bf2fa7ed --- /dev/null +++ b/1b121b21bc4seed2/evaluation/rankeval/1b121b21bc4seed2_0.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.334,0.01492201952373296,0 +anli_r2,acc,0.339,0.014976758771620344,0 +anli_r3,acc,0.33,0.013579531277800922,0 +arc_challenge,acc,0.22610921501706485,0.012224202097063288,0 +arc_challenge,acc_norm,0.2645051194539249,0.01288927294931337,0 +arc_easy,acc,0.5143097643097643,0.010255580881603627,0 +arc_easy,acc_norm,0.44486531986531985,0.010197216690356413,0 +boolq,acc,0.5697247706422018,0.008659608602932497,1 +cb,acc,0.4107142857142857,0.0663363415035954,1 +cb,f1,0.25247782994261864,,1 +copa,acc,0.7,0.046056618647183814,0 +hellaswag,acc,0.35222067317267475,0.004766860907171548,0 +hellaswag,acc_norm,0.43198566022704643,0.004943400892881058,0 +piqa,acc,0.705114254624592,0.010639030620157001,0 +piqa,acc_norm,0.6980413492927094,0.010711732891588338,0 +rte,acc,0.5379061371841155,0.03000984891252912,0 +sciq,acc,0.752,0.01366318713487766,0 +sciq,acc_norm,0.667,0.014910846164229859,0 +storycloze_2016,acc,0.6397648316408338,0.011101519668493525,0 +winogrande,acc,0.5209155485398579,0.014040185494212949,0 diff --git a/1b121b21bc4seed2/evaluation/rankeval/1b121b21bc4seed2_0.json b/1b121b21bc4seed2/evaluation/rankeval/1b121b21bc4seed2_0.json new file mode 100644 index 0000000000000000000000000000000000000000..cd52ffdb28b4132da057943968a3fbb875166737 --- /dev/null +++ b/1b121b21bc4seed2/evaluation/rankeval/1b121b21bc4seed2_0.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.334, + "acc_stderr": 0.01492201952373296 + }, + "anli_r2": { + "acc": 0.339, + "acc_stderr": 0.014976758771620344 + }, + "anli_r3": { + "acc": 0.33, + "acc_stderr": 0.013579531277800922 + }, + "cb": { + "acc": 0.4107142857142857, + "acc_stderr": 0.0663363415035954, + "f1": 0.25247782994261864 + }, + "copa": { + "acc": 0.7, + "acc_stderr": 0.046056618647183814 + }, + "hellaswag": { + "acc": 0.35222067317267475, + "acc_stderr": 0.004766860907171548, + "acc_norm": 0.43198566022704643, + "acc_norm_stderr": 0.004943400892881058 + }, + "rte": { + "acc": 0.5379061371841155, + "acc_stderr": 0.03000984891252912 + }, + "winogrande": { + "acc": 0.5209155485398579, + "acc_stderr": 0.014040185494212949 + }, + "storycloze_2016": { + "acc": 0.6397648316408338, + "acc_stderr": 0.011101519668493525 + }, + "boolq": { + "acc": 0.5697247706422018, + "acc_stderr": 0.008659608602932497 + }, + "arc_easy": { + "acc": 0.5143097643097643, + "acc_stderr": 0.010255580881603627, + "acc_norm": 0.44486531986531985, + "acc_norm_stderr": 0.010197216690356413 + }, + "arc_challenge": { + "acc": 0.22610921501706485, + "acc_stderr": 0.012224202097063288, + "acc_norm": 0.2645051194539249, + "acc_norm_stderr": 0.01288927294931337 + }, + "sciq": { + "acc": 0.752, + "acc_stderr": 0.01366318713487766, + "acc_norm": 0.667, + "acc_norm_stderr": 0.014910846164229859 + }, + "piqa": { + "acc": 0.705114254624592, + "acc_stderr": 0.010639030620157001, + "acc_norm": 0.6980413492927094, + "acc_norm_stderr": 0.010711732891588338 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed2/evaluation/rankeval/1b121b21bc4seed2_1.csv b/1b121b21bc4seed2/evaluation/rankeval/1b121b21bc4seed2_1.csv new file mode 100644 index 0000000000000000000000000000000000000000..91d6efcc91ecab7f8595d73bd68d50c29fd3d6df --- /dev/null +++ b/1b121b21bc4seed2/evaluation/rankeval/1b121b21bc4seed2_1.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.336,0.014944140233795023,0 +anli_r2,acc,0.35,0.015090650341444235,0 +anli_r3,acc,0.32916666666666666,0.013570806258433616,0 +arc_challenge,acc,0.2226962457337884,0.012158314774829928,0 +arc_challenge,acc_norm,0.2645051194539249,0.012889272949313368,0 +arc_easy,acc,0.5054713804713805,0.010259169228615046,0 +arc_easy,acc_norm,0.4541245791245791,0.010216507710244096,0 +boolq,acc,0.5397553516819572,0.00871736823978605,1 +cb,acc,0.5178571428571429,0.06737697508644648,1 +cb,f1,0.35609696074812347,,1 +copa,acc,0.7,0.046056618647183814,0 +hellaswag,acc,0.3514240191196973,0.0047643939851110305,0 +hellaswag,acc_norm,0.43238398725353516,0.0049439450696114485,0 +piqa,acc,0.7013057671381937,0.01067855639814924,0 +piqa,acc_norm,0.6958650707290533,0.01073349333572131,0 +rte,acc,0.5487364620938628,0.029953149241808946,0 +sciq,acc,0.805,0.01253523562331933,0 +sciq,acc_norm,0.739,0.01389503767796513,0 +storycloze_2016,acc,0.6312132549438803,0.011157191913955243,0 +winogrande,acc,0.5335438042620363,0.0140208266775981,0 diff --git a/1b121b21bc4seed2/evaluation/rankeval/1b121b21bc4seed2_1.json b/1b121b21bc4seed2/evaluation/rankeval/1b121b21bc4seed2_1.json new file mode 100644 index 0000000000000000000000000000000000000000..f6a01492f4969ba0e1ef1fdcbbe71de012b680ee --- /dev/null +++ b/1b121b21bc4seed2/evaluation/rankeval/1b121b21bc4seed2_1.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.336, + "acc_stderr": 0.014944140233795023 + }, + "anli_r2": { + "acc": 0.35, + "acc_stderr": 0.015090650341444235 + }, + "anli_r3": { + "acc": 0.32916666666666666, + "acc_stderr": 0.013570806258433616 + }, + "cb": { + "acc": 0.5178571428571429, + "acc_stderr": 0.06737697508644648, + "f1": 0.35609696074812347 + }, + "copa": { + "acc": 0.7, + "acc_stderr": 0.046056618647183814 + }, + "hellaswag": { + "acc": 0.3514240191196973, + "acc_stderr": 0.0047643939851110305, + "acc_norm": 0.43238398725353516, + "acc_norm_stderr": 0.0049439450696114485 + }, + "rte": { + "acc": 0.5487364620938628, + "acc_stderr": 0.029953149241808946 + }, + "winogrande": { + "acc": 0.5335438042620363, + "acc_stderr": 0.0140208266775981 + }, + "storycloze_2016": { + "acc": 0.6312132549438803, + "acc_stderr": 0.011157191913955243 + }, + "boolq": { + "acc": 0.5397553516819572, + "acc_stderr": 0.00871736823978605 + }, + "arc_easy": { + "acc": 0.5054713804713805, + "acc_stderr": 0.010259169228615046, + "acc_norm": 0.4541245791245791, + "acc_norm_stderr": 0.010216507710244096 + }, + "arc_challenge": { + "acc": 0.2226962457337884, + "acc_stderr": 0.012158314774829928, + "acc_norm": 0.2645051194539249, + "acc_norm_stderr": 0.012889272949313368 + }, + "sciq": { + "acc": 0.805, + "acc_stderr": 0.01253523562331933, + "acc_norm": 0.739, + "acc_norm_stderr": 0.01389503767796513 + }, + "piqa": { + "acc": 0.7013057671381937, + "acc_stderr": 0.01067855639814924, + "acc_norm": 0.6958650707290533, + "acc_norm_stderr": 0.01073349333572131 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed2/evaluation/rankeval/1b121b21bc4seed2_2.csv b/1b121b21bc4seed2/evaluation/rankeval/1b121b21bc4seed2_2.csv new file mode 100644 index 0000000000000000000000000000000000000000..e07fa14d9e67aeacf4630bbfe5c19b1d83d6fbdd --- /dev/null +++ b/1b121b21bc4seed2/evaluation/rankeval/1b121b21bc4seed2_2.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.326,0.014830507204541044,0 +anli_r2,acc,0.335,0.014933117490932577,0 +anli_r3,acc,0.33666666666666667,0.01364760294240639,0 +arc_challenge,acc,0.21075085324232082,0.01191827175485218,0 +arc_challenge,acc_norm,0.2525597269624573,0.012696728980207704,0 +arc_easy,acc,0.5227272727272727,0.01024917909060597,0 +arc_easy,acc_norm,0.4903198653198653,0.010257860554461122,0 +boolq,acc,0.5467889908256881,0.00870668126587249,1 +cb,acc,0.44642857142857145,0.06703189227942398,1 +cb,f1,0.2790890269151139,,1 +copa,acc,0.65,0.047937248544110196,0 +hellaswag,acc,0.35132443736307506,0.004764084597176907,0 +hellaswag,acc_norm,0.4304919338777136,0.0049413312155985566,0 +piqa,acc,0.6980413492927094,0.010711732891588352,0 +piqa,acc_norm,0.6926006528835691,0.010765602506939063,0 +rte,acc,0.48736462093862815,0.030086851767188564,0 +sciq,acc,0.817,0.012233587399477828,0 +sciq,acc_norm,0.787,0.012953717566737216,0 +storycloze_2016,acc,0.6312132549438803,0.01115719191395524,0 +winogrande,acc,0.5311760063141279,0.014025142640639515,0 diff --git a/1b121b21bc4seed2/evaluation/rankeval/1b121b21bc4seed2_2.json b/1b121b21bc4seed2/evaluation/rankeval/1b121b21bc4seed2_2.json new file mode 100644 index 0000000000000000000000000000000000000000..fa0ada70d96284a3755505df333532d30f3ef6ae --- /dev/null +++ b/1b121b21bc4seed2/evaluation/rankeval/1b121b21bc4seed2_2.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.326, + "acc_stderr": 0.014830507204541044 + }, + "anli_r2": { + "acc": 0.335, + "acc_stderr": 0.014933117490932577 + }, + "anli_r3": { + "acc": 0.33666666666666667, + "acc_stderr": 0.01364760294240639 + }, + "cb": { + "acc": 0.44642857142857145, + "acc_stderr": 0.06703189227942398, + "f1": 0.2790890269151139 + }, + "copa": { + "acc": 0.65, + "acc_stderr": 0.047937248544110196 + }, + "hellaswag": { + "acc": 0.35132443736307506, + "acc_stderr": 0.004764084597176907, + "acc_norm": 0.4304919338777136, + "acc_norm_stderr": 0.0049413312155985566 + }, + "rte": { + "acc": 0.48736462093862815, + "acc_stderr": 0.030086851767188564 + }, + "winogrande": { + "acc": 0.5311760063141279, + "acc_stderr": 0.014025142640639515 + }, + "storycloze_2016": { + "acc": 0.6312132549438803, + "acc_stderr": 0.01115719191395524 + }, + "boolq": { + "acc": 0.5467889908256881, + "acc_stderr": 0.00870668126587249 + }, + "arc_easy": { + "acc": 0.5227272727272727, + "acc_stderr": 0.01024917909060597, + "acc_norm": 0.4903198653198653, + "acc_norm_stderr": 0.010257860554461122 + }, + "arc_challenge": { + "acc": 0.21075085324232082, + "acc_stderr": 0.01191827175485218, + "acc_norm": 0.2525597269624573, + "acc_norm_stderr": 0.012696728980207704 + }, + "sciq": { + "acc": 0.817, + "acc_stderr": 0.012233587399477828, + "acc_norm": 0.787, + "acc_norm_stderr": 0.012953717566737216 + }, + "piqa": { + "acc": 0.6980413492927094, + "acc_stderr": 0.010711732891588352, + "acc_norm": 0.6926006528835691, + "acc_norm_stderr": 0.010765602506939063 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed2/evaluation/rankeval/1b121b21bc4seed2_3.csv b/1b121b21bc4seed2/evaluation/rankeval/1b121b21bc4seed2_3.csv new file mode 100644 index 0000000000000000000000000000000000000000..49c9600cfc1c4dfe02d656d686d5fb35aa703844 --- /dev/null +++ b/1b121b21bc4seed2/evaluation/rankeval/1b121b21bc4seed2_3.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.329,0.014865395385928381,0 +anli_r2,acc,0.344,0.015029633724408948,0 +anli_r3,acc,0.3458333333333333,0.01373624534231101,0 +arc_challenge,acc,0.2235494880546075,0.01217489663120261,0 +arc_challenge,acc_norm,0.2593856655290102,0.012808273573927099,0 +arc_easy,acc,0.5155723905723906,0.01025480633196189,0 +arc_easy,acc_norm,0.48695286195286197,0.010256289925058452,0 +boolq,acc,0.5425076452599389,0.00871339478784262,1 +cb,acc,0.5357142857142857,0.06724777654937658,1 +cb,f1,0.3263888888888889,,1 +copa,acc,0.71,0.045604802157206845,0 +hellaswag,acc,0.3536148177653854,0.004771143074426134,0 +hellaswag,acc_norm,0.4326827325234017,0.004944351065545855,0 +piqa,acc,0.6980413492927094,0.010711732891588352,0 +piqa,acc_norm,0.6985854189336235,0.01070624824275376,0 +rte,acc,0.5234657039711191,0.03006330041190266,0 +sciq,acc,0.822,0.012102167676183592,0 +sciq,acc_norm,0.787,0.012953717566737221,0 +storycloze_2016,acc,0.6349545697487974,0.011133301783914872,0 +winogrande,acc,0.5430149960536701,0.01400038676159829,0 diff --git a/1b121b21bc4seed2/evaluation/rankeval/1b121b21bc4seed2_3.json b/1b121b21bc4seed2/evaluation/rankeval/1b121b21bc4seed2_3.json new file mode 100644 index 0000000000000000000000000000000000000000..5278ca8903ecbebd6bc7bed8e58818c2dad6691a --- /dev/null +++ b/1b121b21bc4seed2/evaluation/rankeval/1b121b21bc4seed2_3.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.329, + "acc_stderr": 0.014865395385928381 + }, + "anli_r2": { + "acc": 0.344, + "acc_stderr": 0.015029633724408948 + }, + "anli_r3": { + "acc": 0.3458333333333333, + "acc_stderr": 0.01373624534231101 + }, + "cb": { + "acc": 0.5357142857142857, + "acc_stderr": 0.06724777654937658, + "f1": 0.3263888888888889 + }, + "copa": { + "acc": 0.71, + "acc_stderr": 0.045604802157206845 + }, + "hellaswag": { + "acc": 0.3536148177653854, + "acc_stderr": 0.004771143074426134, + "acc_norm": 0.4326827325234017, + "acc_norm_stderr": 0.004944351065545855 + }, + "rte": { + "acc": 0.5234657039711191, + "acc_stderr": 0.03006330041190266 + }, + "winogrande": { + "acc": 0.5430149960536701, + "acc_stderr": 0.01400038676159829 + }, + "storycloze_2016": { + "acc": 0.6349545697487974, + "acc_stderr": 0.011133301783914872 + }, + "boolq": { + "acc": 0.5425076452599389, + "acc_stderr": 0.00871339478784262 + }, + "arc_easy": { + "acc": 0.5155723905723906, + "acc_stderr": 0.01025480633196189, + "acc_norm": 0.48695286195286197, + "acc_norm_stderr": 0.010256289925058452 + }, + "arc_challenge": { + "acc": 0.2235494880546075, + "acc_stderr": 0.01217489663120261, + "acc_norm": 0.2593856655290102, + "acc_norm_stderr": 0.012808273573927099 + }, + "sciq": { + "acc": 0.822, + "acc_stderr": 0.012102167676183592, + "acc_norm": 0.787, + "acc_norm_stderr": 0.012953717566737221 + }, + "piqa": { + "acc": 0.6980413492927094, + "acc_stderr": 0.010711732891588352, + "acc_norm": 0.6985854189336235, + "acc_norm_stderr": 0.01070624824275376 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed2/evaluation/rankeval/1b121b21bc4seed2_4.csv b/1b121b21bc4seed2/evaluation/rankeval/1b121b21bc4seed2_4.csv new file mode 100644 index 0000000000000000000000000000000000000000..c679aa28ae6a88782dd35c4281a12aa914fe8ec2 --- /dev/null +++ b/1b121b21bc4seed2/evaluation/rankeval/1b121b21bc4seed2_4.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.338,0.014965960710224473,0 +anli_r2,acc,0.339,0.014976758771620344,0 +anli_r3,acc,0.3383333333333333,0.01366414400661827,0 +arc_challenge,acc,0.2150170648464164,0.012005717634133604,0 +arc_challenge,acc_norm,0.2593856655290102,0.012808273573927095,0 +arc_easy,acc,0.5210437710437711,0.01025069260202257,0 +arc_easy,acc_norm,0.49957912457912457,0.01025977988609443,0 +boolq,acc,0.5397553516819572,0.00871736823978605,1 +cb,acc,0.5178571428571429,0.06737697508644647,1 +cb,f1,0.2908378541289934,,1 +copa,acc,0.66,0.04760952285695237,0 +hellaswag,acc,0.351822346146186,0.004765629263643523,0 +hellaswag,acc_norm,0.4320852419836686,0.0049435372423444176,0 +piqa,acc,0.6947769314472253,0.01074426704560648,0 +piqa,acc_norm,0.6969532100108814,0.0107226486895315,0 +rte,acc,0.48736462093862815,0.030086851767188564,0 +sciq,acc,0.824,0.01204861689859752,0 +sciq,acc_norm,0.801,0.012631649083099179,0 +storycloze_2016,acc,0.6386958845537146,0.011108686479432282,0 +winogrande,acc,0.5335438042620363,0.0140208266775981,0 diff --git a/1b121b21bc4seed2/evaluation/rankeval/1b121b21bc4seed2_4.json b/1b121b21bc4seed2/evaluation/rankeval/1b121b21bc4seed2_4.json new file mode 100644 index 0000000000000000000000000000000000000000..9fbe55bcf2071d8c49455688a94c7bb9b394a0a6 --- /dev/null +++ b/1b121b21bc4seed2/evaluation/rankeval/1b121b21bc4seed2_4.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.338, + "acc_stderr": 0.014965960710224473 + }, + "anli_r2": { + "acc": 0.339, + "acc_stderr": 0.014976758771620344 + }, + "anli_r3": { + "acc": 0.3383333333333333, + "acc_stderr": 0.01366414400661827 + }, + "cb": { + "acc": 0.5178571428571429, + "acc_stderr": 0.06737697508644647, + "f1": 0.2908378541289934 + }, + "copa": { + "acc": 0.66, + "acc_stderr": 0.04760952285695237 + }, + "hellaswag": { + "acc": 0.351822346146186, + "acc_stderr": 0.004765629263643523, + "acc_norm": 0.4320852419836686, + "acc_norm_stderr": 0.0049435372423444176 + }, + "rte": { + "acc": 0.48736462093862815, + "acc_stderr": 0.030086851767188564 + }, + "winogrande": { + "acc": 0.5335438042620363, + "acc_stderr": 0.0140208266775981 + }, + "storycloze_2016": { + "acc": 0.6386958845537146, + "acc_stderr": 0.011108686479432282 + }, + "boolq": { + "acc": 0.5397553516819572, + "acc_stderr": 0.00871736823978605 + }, + "arc_easy": { + "acc": 0.5210437710437711, + "acc_stderr": 0.01025069260202257, + "acc_norm": 0.49957912457912457, + "acc_norm_stderr": 0.01025977988609443 + }, + "arc_challenge": { + "acc": 0.2150170648464164, + "acc_stderr": 0.012005717634133604, + "acc_norm": 0.2593856655290102, + "acc_norm_stderr": 0.012808273573927095 + }, + "sciq": { + "acc": 0.824, + "acc_stderr": 0.01204861689859752, + "acc_norm": 0.801, + "acc_norm_stderr": 0.012631649083099179 + }, + "piqa": { + "acc": 0.6947769314472253, + "acc_stderr": 0.01074426704560648, + "acc_norm": 0.6969532100108814, + "acc_norm_stderr": 0.0107226486895315 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed2/evaluation/rankeval/1b121b21bc4seed2_5.csv b/1b121b21bc4seed2/evaluation/rankeval/1b121b21bc4seed2_5.csv new file mode 100644 index 0000000000000000000000000000000000000000..ed4f042b281a2f156df5a2508d3f7c9555258433 --- /dev/null +++ b/1b121b21bc4seed2/evaluation/rankeval/1b121b21bc4seed2_5.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.345,0.015039986742055235,0 +anli_r2,acc,0.341,0.014998131348402695,0 +anli_r3,acc,0.3458333333333333,0.013736245342311012,0 +arc_challenge,acc,0.23037542662116042,0.01230492841874761,0 +arc_challenge,acc_norm,0.2568259385665529,0.0127669237941168,0 +arc_easy,acc,0.5231481481481481,0.010248782484554473,0 +arc_easy,acc_norm,0.5008417508417509,0.010259768981815234,0 +boolq,acc,0.5388379204892967,0.008718633258803963,1 +cb,acc,0.5535714285714286,0.06703189227942395,1 +cb,f1,0.3459575611066344,,1 +copa,acc,0.69,0.04648231987117316,0 +hellaswag,acc,0.3525194184425413,0.004767782256041005,0 +hellaswag,acc_norm,0.4327823142800239,0.004944485990639511,0 +piqa,acc,0.6958650707290533,0.010733493335721319,0 +piqa,acc_norm,0.6931447225244831,0.010760295070580374,0 +rte,acc,0.4981949458483754,0.030096267148976626,0 +sciq,acc,0.845,0.011450157470799466,0 +sciq,acc_norm,0.819,0.012181436179177907,0 +storycloze_2016,acc,0.632816675574559,0.01114704178136865,0 +winogrande,acc,0.5343330702446725,0.014019317531542572,0 diff --git a/1b121b21bc4seed2/evaluation/rankeval/1b121b21bc4seed2_5.json b/1b121b21bc4seed2/evaluation/rankeval/1b121b21bc4seed2_5.json new file mode 100644 index 0000000000000000000000000000000000000000..5e56760ee878c1ac94b6ec4f8352c4fa1c5cfbd9 --- /dev/null +++ b/1b121b21bc4seed2/evaluation/rankeval/1b121b21bc4seed2_5.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.345, + "acc_stderr": 0.015039986742055235 + }, + "anli_r2": { + "acc": 0.341, + "acc_stderr": 0.014998131348402695 + }, + "anli_r3": { + "acc": 0.3458333333333333, + "acc_stderr": 0.013736245342311012 + }, + "cb": { + "acc": 0.5535714285714286, + "acc_stderr": 0.06703189227942395, + "f1": 0.3459575611066344 + }, + "copa": { + "acc": 0.69, + "acc_stderr": 0.04648231987117316 + }, + "hellaswag": { + "acc": 0.3525194184425413, + "acc_stderr": 0.004767782256041005, + "acc_norm": 0.4327823142800239, + "acc_norm_stderr": 0.004944485990639511 + }, + "rte": { + "acc": 0.4981949458483754, + "acc_stderr": 0.030096267148976626 + }, + "winogrande": { + "acc": 0.5343330702446725, + "acc_stderr": 0.014019317531542572 + }, + "storycloze_2016": { + "acc": 0.632816675574559, + "acc_stderr": 0.01114704178136865 + }, + "boolq": { + "acc": 0.5388379204892967, + "acc_stderr": 0.008718633258803963 + }, + "arc_easy": { + "acc": 0.5231481481481481, + "acc_stderr": 0.010248782484554473, + "acc_norm": 0.5008417508417509, + "acc_norm_stderr": 0.010259768981815234 + }, + "arc_challenge": { + "acc": 0.23037542662116042, + "acc_stderr": 0.01230492841874761, + "acc_norm": 0.2568259385665529, + "acc_norm_stderr": 0.0127669237941168 + }, + "sciq": { + "acc": 0.845, + "acc_stderr": 0.011450157470799466, + "acc_norm": 0.819, + "acc_norm_stderr": 0.012181436179177907 + }, + "piqa": { + "acc": 0.6958650707290533, + "acc_stderr": 0.010733493335721319, + "acc_norm": 0.6931447225244831, + "acc_norm_stderr": 0.010760295070580374 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c252d8f2996a2ce58afab33949ab012d18157089 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c641de271753a5feaeb0b47dfad40e93e825bc5e2569e1769f781e1a36b82798 +size 51395415 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..89be9f4888610112255db25c17f65d4cc2f5ee03 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eecf8e9b50bdd2ae79cc3e42170bc8d07ae753c0169e9aefa41986624262ad17 +size 51395373 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f09403f79fcba8f0c1f2b9c1c568588b1ffc315 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:739230947f3d3cedeca96ecdffd0df2e5adab1caa3a47f30857175e1842bd800 +size 51395437 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..54c3cb806f7f27ed60568d39fdce37086306893a --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:175be88a6a7a2cddfdc8926e7900a9fd4e3606bbba878e72a36a0987106abfa7 +size 51395501 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..903dc6940ac4f969909639664b386800d1796f6d --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1aafd865d74748c977b18618479311a6bc357c36b42e51b8a031c18216615a3d +size 51395565 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3d073d2765d8d6ae753cfe0da712caaf42d9232e --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4d54df7c5ecefa44b7a6d026e4aa8ab4dcb3a0626944521d1ebbc6863db7465 +size 51395373 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe60438c5b9710f1f8f3375024b208a777e9927d --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83c31f467907fa6af8ad08c296dc31752e8c0a72c61dd96454bd9bd9e8cc53c7 +size 51395373 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9d1c11a6fac794ec66467b06d8e4d254bfda999c --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2dff52ee01c8d4bad9c09193690411e71b0536d021878c15163e6c59ddb356aa +size 51395437 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d672e075b9ad78dd58f67167810af7a318c28e37 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4fd1ffafa06c391260ca67f3eb2b1eecfb815d8229e4089a4438f7ea4bd53f2 +size 51395501 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f8fcef8fc42623f8bcbea80e67c803f84100bbc --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6d0d0146627128219269fcb3ac7f683b32624d18953a671b803873a3b3d17d5 +size 51395437 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e10f5b87f0ad841b6badaeb11805b5178fc47e66 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e27339932e53479b04406452d8219cd22d5b0455616f2a44d39ff09358fcf41f +size 51395501 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..800abd4c4744c611cc4c8bd8fedb59a99b2c65cd --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:139fc149d74675075f4f4261670214f5424826482d30af93a388edfb0aa1c22d +size 51395426 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e23e4e9c0bd3a4592445b93b4f501f2e6171fa1 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0302b3a600aac2bd4c1f7066ad237e62d18bb001782c5cb0d771a283e31ad9b8 +size 51395373 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d0836884f46de8dac4f7be3b43263dab865618a9 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0576cf01f68628dd51b9600920f34cdd655e3dc50f57732b06f2ea6bb8d380c5 +size 51395437 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..11b4f02da603ddab46d20aee0fbf32ad6425181e --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:925f79993126efceef17609034f38626e658f7d28b99ac83b5809fc71b4da9fd +size 51395501 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ce02f085cc822cb8a2ffd12bdd26f46034ce693 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20fe1db84f9b5951dea2fd59eb5c6e4a6b2590ffe490913218a6bdd64bf814ea +size 51395501 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eaaf71cde9343c7061429d6baf943eb0b3a46767 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b2f3aa4191bbeef98d43d12a8be1c8a9a353ba6bf5b6bee4f8a80e55b9df2f5 +size 51395437 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..925b945ab305c0a6752b55f04fb49308d79b6ce9 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc3c4cfd10f1dbc42efc754b31f2b61ee231a260bbafa797485062916eb49405 +size 51395437 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..84219995066e4e70375ac9063544ed3a94153d23 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:770eb042a014aef284d47b236930a15f857422198b422ca1025094cdb0b6f52a +size 51395373 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..17750cdec5a79a3fd418b6040ef1bd7ec349d737 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3af73077b66d3a4e5529344bc65e96ee81fbf3d0f685af923eca938d45c7072 +size 51395373 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..43af9152fae6be1bd8cc97a213b715fba4aa265c --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:adaf14eeee280819a214f61eb4231af224bbce7a77cc7a8929ba2bfa42b5b6f4 +size 51395437 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..17105530b36e6a5722a5d68b0d3ee1fe48fbce15 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10532bdc5f373915c8c4e227a33c63e2b264daf4235fc59d2f7fda3bd9c601db +size 51395373 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e068b55519f95b016876451f5560621849c112f6 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c3c96bdd551c3206108c2098a07a0638a346dacf2b883f7c8c00b195e4980d7 +size 51395490 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf174b9b668ec55c3f8d4dbe46bbf3055f6f9a11 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d2b6f726d8a3feaa3bfcd9df923cbe65f10e120630bff5a10dbb7dbc6625bec +size 51395437 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..85aa166c5c0a909d7224b37ecf29632e6442c964 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0178383b51df100f4ecfa115ecf5c07e46a856344e397dc711781ee6fad20f97 +size 51395565 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c33a1b7e428d8983a3d2d69ff570a6d9d3e884fc --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6fe4ebac77d6004426198f11fb5641d0122a8b542ab025f6ef6a70ec91155d5 +size 51395437 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b069da3e4e0bd09f9250eca2d62f29dae35a6a68 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3f5210ed066f6308abbf34def6260c4ca2d46ce8b22d68eec6a750406f810c9 +size 51395437 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c8077a16e9e208271b5ef339f7eb439e7bfed408 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3248b42fcab3d931ef0f16c8ae48de5d02628f344c88567009d0aca7b83f0b35 +size 51395373 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e007909196e9979e05220f986c1601f3c841e58 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1cab9ca040956953198c88f9432cddd6951db458966f77e132db322c435e2bc +size 51395373 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2996085a6dfe9991a1cdf5b2f002b0d52897e729 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b82a4a0c9777329783885c2d435f6fe3bf16a42149bb9e098b8ae3fbdad27f76 +size 51395565 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd17d310888cd3422cf331e2b3923553679fbd65 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2164daa56a76c59b249117a76dfe84f3c202a2d9a32539db4be3c1ddfdd2f782 +size 51395437 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_128_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_128_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c734c70936049d2053e90425d91cfa5a7d509532 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_128_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a1bf62da8162b0d542202931d90043bd413ff6441a4e79e8e6877a27ff7b208 +size 51395437 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_129_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_129_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..70272565d25d2e1809965bd4edd7e697641fe191 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_129_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce97fcab5735a7bb12dd1d5f595ae080cf09839e74261aac3fab885f0fe64365 +size 51395373 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f920f623e2e6e59e8dea9b1de75db9a57df5584 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:829cdf752e842913dedc80f3086a29ee16a7be43d6f7a3b29a51e7db333d146a +size 51395426 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_130_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_130_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..54925fda73cde1e23716511c7a393f2d7d0239a4 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_130_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e74fc47c4052de08db6b73275ae46ccb7d8b8318fad3d0cc570f01778b283ba +size 51395437 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_131_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_131_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..39ee819827997a27538433cb5d6f11b6f804e311 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_131_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03258d61f500d154afb41a6685204e95061265d0f28933fd524c5b0622e337e9 +size 51395565 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_132_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_132_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..93433d96d9a9fdc8cbbaeaf36a6de878b3cf9a26 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_132_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4379b7a7e19605e9eec7e7bf290ff36241d098d8ea9bedb0b384222bc187be9 +size 51395437 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_133_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_133_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d28ed2d05137547eb99b9e4b5b24c198a1eaabd4 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_133_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ecb407501271afd19532a857be91bcf1673a03869f090904442137f0be57b32b +size 51395437 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_134_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_134_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7deabec17b12de28aab560ac035a0b07269da88d --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_134_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1f65d82d9be02e72e367b134a7eed8a33af0932e75a296be4f2910d60b52100 +size 51395437 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_135_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_135_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb4183746f916fb6a17a7f964d259586eaca1053 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_135_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75856b1545df9a7d572373e246ee37f6539c2ade135ead8b52e65bc265bf4927 +size 51395373 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_136_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_136_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3df69460944a0de80928d593ab92e7201bc95c42 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_136_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0feb90768ea9ec2983e24bb1bc119624a093ed3d1cbd69e1a690a3cee2205058 +size 51395373 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_137_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_137_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e9cde494a279f774d662df11a8ed042baafc5d4a --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_137_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfa694c9fd19d53caa420c21b69ad9b5cc2ec68c80426c3e2a29e60667d1f51b +size 51395501 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_138_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_138_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d82509d9bade1963b370c8eebbbca52b4e3ee6d --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_138_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5717359842cce2cfc09f4c1e2937d18237f80cfd5c17ec65b752bb9b9d071ea +size 51395437 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_139_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_139_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..90b5d0e122038d42c4c5102d73f71dd21ee6d916 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_139_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28209a326a0119f397bec665f1f16b260e3fdb57c84ac8650308161b6c0cd48e +size 51395373 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..87a15107c59360fce15d8d9c2163d6c0ca1ec8e2 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab3b8de1743fb2db15854a285f907fc644e4e9de405fc627d2d39fc0090bf5f5 +size 51395426 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_140_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_140_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5106d7abf3fb31138e109c1561a387860a960a17 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_140_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa071b9f794f62bb6421a9252301a1ae932a7035d0f5a871f8792e7cf7aed823 +size 51395501 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_141_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_141_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..50eabf6f7273c94b73ebe5935762e9fdda904a61 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_141_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4345539716ecbc0293cd2dec70d864163e12455579104376254d67c04e575952 +size 51395437 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_142_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_142_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..63930f28e5687d65d9abe3d6e9cf46fb5092a876 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_142_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4fa77b25c34e942db625da8e4df1d4f6125c3e048d3fbf2a770604ad5d65b08 +size 51395501 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_143_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_143_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d75654be32ede901747fc79aa74e80678d7f1f73 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_143_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:728f2b1c87c08f85905ac00132505913010d0aed8e6bc6d773dd118f1d2d61de +size 51395437 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_144_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_144_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..892e3b94a0227abcca348a8cfd5011dfa5dda174 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_144_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef84accab5d30a2897692ba9a7154586ac7a8e91a0025f4c9af1e5c152fd6b89 +size 51395373 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_145_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_145_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7124197f786d35b173f9b1b4d920e7c9f86fb73e --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_145_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0813987d8c44742d0aa5cf383e964d57d8e3e324ac6fd8beb480412d3c2c019 +size 51395437 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_146_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_146_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5987e7f8c91d566abb042933e59d989670f42b82 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_146_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb283d264f5d3493e49e532798b7cea3e4f583e6eb034a7f98eef1c1374a863b +size 51395437 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_147_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_147_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e322f3771ef49241c930af6fcf913150b7c56875 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_147_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d74f4b79fcf6bb988c05cd9729f3b759bcfa436977017fbb1b9be730ef3041bb +size 51395565 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_148_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_148_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4924520d5bdc77e3ee26a646e7878fc17de19b0f --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_148_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2f32797da647376a85af9e36d36711757778c652f6728fa8a75bd2fbb45e571 +size 51395501 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_149_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_149_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fff5e8f465ff6574ae61d3d188a246738cb7d393 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_149_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed533034e7c711eb4c45919a5043ba507bd1884a59de3a666aad75fc05ae032e +size 51395373 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..44aa10ba2ff2ff81a3c2e8023e032d66889322c0 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8bceea8e0e308454d6b1e1e267dc68307182e28ad22c41b3e786dbc4a8b04809 +size 51395426 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_150_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_150_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a4d06c558f6dd697133a30de1b5f89b346a45701 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_150_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5116650fce38dca74437a93ab1cdf8b2fdffa601e9c984936fd32f213f251bef +size 51395437 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_151_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_151_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9930d87af5a59855c6f359bac28317ef86848db8 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_151_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:783dc1a6fcbad27950a4169db54372517b8428d70bb7e2fc49d03806b5e9255d +size 51395437 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_152_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_152_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..354b7d826b73ea8cbb0c060ec949143bcde85f2b --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_152_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b16772a596bc573552bb43a43093a0dd49f008fd28d3c2893051598f05bc56d0 +size 51395437 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_153_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_153_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5967ee0eb810bcbe07aa7ef9bd2c1024740bb951 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_153_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5def52a83b74b36e50a566133cc84ace847efe9c26e8fddfebe582deda8f302a +size 51395437 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_154_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_154_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f87fd25b6c1de17c616e9ad1a409f46ca410e24 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_154_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7f835b9283e5165f4fe78f5dfef93ca1343a65cab049c02d5fcfff6b200be82 +size 51395373 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_155_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_155_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..125027cdfb6611428cff81e10a77fba86483277b --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_155_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c238d6839a0a86ba97750ac99dfaea41afb63683cabf30aef9142a74872191c +size 51395373 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_156_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_156_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dcef4b1c1d1ef65f66ef63cae6f35bfd36b8cb20 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_156_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36cd931f4f9923b09d48cc8b6754e8984b5e020383348f8456bf31016570bd80 +size 51395373 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_157_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_157_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..74aedf8f075a5e89c99cbb1ac8c543184ed54006 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_157_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12a92d189c44229ce30708ed20c5776a97fe8e60bf8befad3b42665ec33d6fe2 +size 51395373 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_158_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_158_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..82d6bb29945fba438d25552c7b2f140ea88d484a --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_158_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d641a4efe9cd447f4e8641d0a2aefb87b9c7fdc30ca6b4674f5498eeb6dd9973 +size 51395437 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_159_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_159_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2db359eb00cc29b1631d3062cf0b1ad071a6a51f --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_159_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41ad0d554ca03088338bb1e7e98d8f215e633f240e468a0a2a9e3c244abe3a31 +size 51395437 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1329cf73ebd98e6e0a4f6af48b52d7622b103fb6 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31ee6af8f80b65459ad4346f8c335c9c4001ae8b194c2fadf964bc2aaed0c823 +size 51395490 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_160_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_160_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1103042f70407c811e644f662a0a51bc6730b8a8 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_160_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3637c8831da54d27f5b00f96470947fb17afab435a14e2b2ee94ff0f7c00500 +size 51395437 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_161_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_161_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aee83c10c24e69d93855e8321ef5594062185e4a --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_161_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5aef430af90fba60c2610190f73d401c476ffeef795ed62746c6ba209cffc18b +size 51395501 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_162_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_162_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..144697669ffdb59383c275a137a0377e295c4017 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_162_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e11a1fac8983a6ea088dc937ecdb9482e9c0f1235576b5303800436bc11cf0d3 +size 51395437 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_163_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_163_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3bec64eccd0b96923595e3fe0df3a583067e90d8 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_163_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc56a0f56fa01da8008f265cdb71db7e1769c4f8221429c9a2fb0602b53d0368 +size 51395373 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_164_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_164_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..58561cb03c2a626610b89950b2c468b4dde8b63f --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_164_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e821b606bb67ae64560c91a4eadc57515b0848af453d767412288229aa6dc266 +size 51395501 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_165_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_165_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..faa51e7e2b1d28ba3d1e652a1581f4e48bc97be6 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_165_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8de3136322bc181e8659fdba1b2c3a1bb8906c164c522879bc081e5dca1881d +size 51395437 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_166_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_166_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..781bcacf318169dc68bd4109b50a6518f03c826d --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_166_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:178ad051a36e47eabd4dd86595210f5e8f3c97ba8cb24fc3bce6c1a44cb7cd38 +size 51395437 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_167_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_167_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a30db9b3212d60db797d62f646a5d0450955ffa --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_167_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc07c63a549867d0fb1b1acaa992e7eaf0e949ae56c5cade0bc37429f36310e3 +size 51395437 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_168_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_168_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d09a6842284d404dcd46ecbad38037667ce64625 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_168_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4124b732cbed2967d3e83303bb6a1e3b355b0824ead14f60fd52d850358637c5 +size 51395373 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_169_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_169_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ddd1a69cc2e3e9197db641b70d463bca517ddb42 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_169_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:604033bdefa3e33dc59011463a895aa342ea0543088a2cf4b500e2029195a24f +size 51395373 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb55399b04e43e2e5c2fddfc719655d7e40aa0e1 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b2db34c59cd5e59fb13c823e74b508d92d0b203a79d3a0ff7c5b3d8d26ba202 +size 51395362 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_170_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_170_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca219aac56fa4334fff62ded8fde3ed844ce78e4 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_170_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:711da3154f07596de7e8e4995c06bcb6ca02daa2a983ea975d06018f13f03143 +size 51395501 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_171_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_171_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e79f2e3fc60182006780bd3b95bd4d42137a1e43 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_171_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3fc209ae868ca1401ccce820f1c71639546afa7097b74d84d8a20e1a3f507244 +size 51395501 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_172_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_172_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..780822a4a66e97e01ad9c5e0664382c4baa66f83 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_172_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9895d9d306f21b4e25ae0e7e95ef8f3a65f1db5eed0d59fb88cfd49631d8a5a2 +size 51395437 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_173_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_173_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..72b0882ec2b0486b78b08d8aeb9216f934704a42 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_173_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d42bacce93fcac7c8d61c516996829b815541ed578468d862df537e01863fb07 +size 51395373 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_174_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_174_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e99a065914240772e31b081b69f76a0f0aabaa9 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_174_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5b87557b4071c3477a3d47197edfa22cad4385c8a12a9cca25dbe42de20ec3d +size 51395373 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_175_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_175_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..23e55adc414010cf706713cf4520597c0772ee04 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_175_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:329081dd6fc89a8e6210036389ff8ec0b526465ee0965160afa2162b8d52c3f2 +size 51395373 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_176_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_176_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..793d8579223d17cecf05a5866d82041b5f56e7ab --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_176_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60ed024ecfb0ee2bed482d8606f2fd7bb00e185c94356ae84cafbd5382b47a2b +size 51395501 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_177_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_177_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..969ec20bcb9fdc8288b8db5ded93444a45b28db4 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_177_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed9c11c7c2740654885141b0bd0fe2af78d21548eafe9080a1e47fdcbd165fa7 +size 51395437 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_178_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_178_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b2e4cb7c83c0454fa0f8f660d8f6a5f64b953bdf --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_178_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f49a02d234e42621bac3cd41bcd719bec98d3930a4b8594793d69d2f7c9e40df +size 51395373 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_179_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_179_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..927270538409b5de0071b125a3ca3dbf48b4ea68 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_179_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b589e73d4b145fbd84366fc55a05644a10d08a9d8511449e22a15243a05f56d8 +size 51395501 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5cff3468a015068949e8a47ed271620d3ad8fba4 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c93d8e1743aacca25d65789c3275804130a708595933094906d1b08551daae6 +size 51395362 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_180_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_180_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eff5f65811aaf6c491afbe108c25a157554fa30d --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_180_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4018ee696bf34deaa33242e541a860e1487d33ab4f3c5974c61c19008e86f5df +size 51395437 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_181_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_181_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f9e6a44621d2f14fc17f67549b978516a1f66ac --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_181_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61f310ab0d3856365aea557848cc724fc266be9ae5ea8c40db796abac1a0cf2e +size 51395501 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_182_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_182_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..89aeb52b962e0788755cba4ceb312032e89f6715 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_182_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20add8d79888335980223074963f1798979ddc15bf0df92c3795966373fac566 +size 51395501 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_183_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_183_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..905e749782dcb49a3d027d7ae3e75f26b56ec165 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_183_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b2fef1045895e0de6c5265031e322f74da0727fc6eb3e652c4249c3bdb69823 +size 51395373 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_184_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_184_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e171f70753832a2441f630c7d95d43976602cd5f --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_184_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7cc90a1fd98033240cca8841d9273cedd78bd92539b76020466b7498f74f553 +size 51395373 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_185_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_185_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e2418694e2c0e9934669366dc79cd777ffd0b8e0 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_185_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8096c4ebc8b5b4d0e35b71413d19a5665c7134bfc6bd4ebd6e21513acb0424b8 +size 51395501 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_186_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_186_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..163b172706e27e4f7ceddd3dd2384080addce975 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_186_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62c7acbc3d8afb5c932434cecead4b34c7df5c5415c0f83a0effc1a0fc08966c +size 51395373 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_187_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_187_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9823b1c482e8c0ac511acd4f6b6446d657d72673 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_187_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eff804e11d01d9840d20634849ecfa1c33ebe4e65a2375a9f5a73a46a8220320 +size 51395437 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_188_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_188_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ac986c57bbb49d79595d72a41a1c2023d1394356 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_188_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f124923dffe921585893449fe9240640ebdf7af2fe62e9de2fdd38e2c9ae3759 +size 51395437 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_189_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_189_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc82d152af43d6467096b3f8d7605b8a55d89827 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_189_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1216f3ec00892e9bf98511ec97babf4a04cd5de4b3f47ddf49ddb4cfe97807e9 +size 51395437 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3831ffde0fd522ebd5e9af5b5abe57abfb6d9afc --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7260a2e469448e31f381147a4c6d4027adf28f2e48a652a26a5e907690b6430 +size 51395426 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_190_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_190_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0b6d50105e4bb243e0ca0d2dc57754a46a1451b4 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_190_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e837d066592dae00a3b0af7d6485bb3b625d204eb8c55bb5430b5b1284213485 +size 51395437 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_191_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_191_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee7ab7ef336879a9614d70a7c02eb942edc54a2d --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_191_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9d50f36ba59ca97cb8b7f2c1c4a754023c07f5da03d34489f87a220a1bce4ea +size 51395437 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_192_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_192_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..187f10403cb92aab148c51726d889b683e28e1db --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_192_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6878f57588207ab1d658873cd2c8ba97043f4e317a0decb778054ccef3789ec6 +size 51395373 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_193_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_193_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..078e57139dddbf8da0be0658b925531c33c9a49a --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_193_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:337544d29c2dc68cd533e22d9d59e5641a086f29a1dc91e303aa9924cceff1b7 +size 51395437 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_194_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_194_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b7680262f64c246301b33461524282eecc7c805d --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_194_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3e3f9636f54ec7f075655dc59cd8ef81cfaa73df9a408bba1df8956c3ec2c67 +size 51395373 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_195_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_195_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8841a55ab0e53aacfc74308901e9e05453ef1079 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_195_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72f4c31864f0b8b689d4048f7ddc42dfdf4fc2260d08d926d21362183d3760cc +size 51395437 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_196_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_196_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cddb273bc6f35b30877147dee7fe60ffce2594b3 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_196_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8b066c6e2a82f63c8f256009aa4f6b75ae0a10f4e4a4c9e9ed5d0341e175e7e +size 51395437 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_197_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_197_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..79c4c54d3e83f314ce36d91c72cc470ef3737de5 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_197_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5c1cb00f8cc0be337378504bcff6c5b8c2fac66be1642de86c9a15e4dc0346d +size 51395437 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_198_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_198_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..54d29a5478a6babbbfc1e8c5afefa45369e73ba7 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_198_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0c7901ef26b6ee143ff19ed4c46cf6f86ecd3c65258f8ee86b8b7527e9fe9d2 +size 51395501 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_199_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_199_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ed54b364107cefa5f5fce0c236a7027da00f578 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_199_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0151659f3008e2472d368e389307557f5d9a6dbb73b32e73c2e167041cbc800 +size 51395501 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..22b13f23250f6fa3d229b10acc1e73ea980000b6 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c1898fae7afaed548e54df355b82712312ee981f264eddc5b8af054d39bf63a +size 51395490 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..453198d57b91921a4d64526edb1118637651cf00 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d21cc36003e2da3ac087851a906da0e0fb6a66653144125539277214cb5615e +size 51395415 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_200_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_200_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e9173c1cc001f32597a67a51ef0afe45e0960666 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_200_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db7241d29ae4ac65f81fcd05b31958a525201754634f78cb115ee77254f90f45 +size 51395437 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_201_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_201_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b2bfdc38b902572d06dc5f19686e7c11bea0fba3 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_201_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bdfc0388911add746c8e14003ddf7fcf10bdfaab3fa82ea71dedf7ae5eeb9bf3 +size 51395501 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_202_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_202_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee60c0740755d61f19b3c2d7e5bc0ad175b3f383 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_202_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:043993c569113d76a5cfee97598ae0c77b01079d4cf43233a0b6dbe72d0da823 +size 51395373 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_203_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_203_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b6f1b2db53bbc65beafd3beab5a3535ca84714e7 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_203_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86e34615dfa50cc7dc5240e06bf00bab7907fbd61741082ecb998339fae338b5 +size 51395437 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_204_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_204_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d4c12db89db7526a9a3cb58eb8db4431bdad4876 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_204_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e13fca263d2b61e5c9b3bbd5932283504617ad8869efe18de169f985da2811fd +size 51395437 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_205_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_205_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7584caab1ed1eb740ba33a9159557cae732d9ca0 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_205_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:925b7fc8d0efa7a1882476e9531b7c3d1da344d2678d7d82892a611c284241c3 +size 51395437 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_206_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_206_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ceaafdd82c2ef42acaee1447989e30205db81548 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_206_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d53dd50947b0c5e4e79c55ee23b9678d567b56c5833d25942461f6e71416963d +size 51395373 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_207_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_207_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..67d0382680b8fcf37fb0371500e34f9f59ecc57a --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_207_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c4fb6b12568aadb3e530eaa35f4742d7e253ebdee96231b3d930fec3eda96f1 +size 51395437 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_208_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_208_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5f3bb5144c9554c0cc419f862aeb345f647a43d1 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_208_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:441fb6ef963684204272431cf917c46590977dad9b24256600e3c4620da55093 +size 51395373 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_209_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_209_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf9da1d3be55fec9db17d09adebd416d96e2f8d0 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_209_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6bf8e0a42b83502120f927fbf7497f7188478ba3542eb39f987ee0a7dd09523 +size 51395437 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..934eb6f7f007ab9ae6fd8cb8168c165e0ac3bb46 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44efcd9b812ab29a7cee09c9cf044c9f83feb57a0a1a9b1b942076a66ac20ac4 +size 51395426 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_210_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_210_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b54bafe3a1bef79843cdc31eb25d3baf11f510e8 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_210_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1521bf2cdbf1c6b661dfc0eb8eab0fd4ea71e44df1463ebc3ee58d6ce1b0aa29 +size 51395565 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_211_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_211_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fed3502986d646c2db146dcf333e9d9da0118a21 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_211_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd28cf364fa0373b087b790b000545f72bdf90fac90ffd715e6edaf5e2e02993 +size 51395501 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_212_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_212_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ddb7a737717312c2ef31c738b94cfb4c231ec3c7 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_212_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d32d5a232b27f6a9d36605d1ec13e4dfc8588a4eb7d9622983476e83ba2ae302 +size 51395373 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_213_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_213_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe40af72511401cc5b47e60d13272a5550ac32e2 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_213_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36b32e9f0ac679903b3a28f8a1f319cc6f8f8bedaf9dd60a09e7d2d40e2894e9 +size 51395373 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_214_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_214_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ad7f7c0dd8e97f45cb2f70e099e3205eafe60df --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_214_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:daaa7241301d6da0695aae4a0f177a85e1bc6feb972c0a2c9a045bb01442c6ba +size 51395437 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_215_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_215_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2daf3876bcd2d7f09346c88467efa951880c122b --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_215_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9fd638bde8f0121a9bf5bc4b8d55410ddb66ad63f8806e50132c34e1b0f98b07 +size 51395501 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_216_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_216_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b674858aa8000c0f1ffeaabb8318bd19d97c38fc --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_216_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d85ce40a8c4c1fe647f5c2459c5abb594538becd51651dbda871903559a6fdb +size 51395501 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_217_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_217_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..232eeb7f9ddfef13812df475d0694d1d28c41770 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_217_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:977f99bcc66e68007837a4d3eb8b7d3973504ee877c56578b4174c4f69e46778 +size 51395437 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_218_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_218_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1fb93303e87310f56fc415482403d4c7262ccb77 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_218_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e2bd612dc47081222226ecbb3d98349489f011c01cdfcc336c766f6c2f76215 +size 51395373 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_219_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_219_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6e9ddbd57bc9b3ac6e75e68b01e1cff9c4f9be03 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_219_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3226f553ac9bcaa851d4b8fc52ec29693b3775e5fc64df73682508fbe4b9fc11 +size 51395501 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9ffbb452f78a88d84737c87a3f87e2cd13270d3d --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8d3efe722c6a10e27666aa1d490a8de6c256a0be32479220ce53db1ab716a12 +size 51395426 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_220_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_220_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..534b382a6959c84e8262aa851063a58660af20cd --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_220_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a35f614669322d4590ddfee1f42b47a98b6f5efdd2bfb967148831630bf406c +size 51395437 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_221_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_221_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..90320fc6294bea3e0bde9e2871448f5f004f2f49 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_221_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:093d90949867beb880787e58505afbdc17af501a4b3a9ae0264a45c949764dd2 +size 51395437 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_222_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_222_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c9ea595f5d861c818ede7e1a1679cedd7ca975e --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_222_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c01880539f0b38a43813eb37a580850d9d53382e97854d413659f149a34216da +size 51395501 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_223_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_223_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b9e8f1b57b5159e8bc066b7b3fce8ce77fbf0f1a --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_223_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae62c9a56bfdde710f2cadd3b8d0caef3b416af0064e469cd8c2551700b9f7b8 +size 51395373 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_224_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_224_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..29459f12f4512e3fa65c0d4352258002a8b88779 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_224_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a513042bfc9549f3949e437880b293dd9b2267130afa45bb95c0d0843883561e +size 51395373 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_225_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_225_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e81788345c4041773fd1cceeb386c586ace3a44 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_225_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2744939ce2545f844067429bbfe9463b69ca242ac422872b7e25b54ddbd20d71 +size 51395437 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_226_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_226_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2cf84aa390f7a67d06d666d6d7e5cd3cc30f44e4 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_226_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:901be3da13fc5952c249d72fa8fdce7feb18284914548184c35676542348efc1 +size 51395437 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_227_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_227_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..739e50c2f474eed38398e17317f0f72ac64ca6c7 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_227_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:663e2461de74928d1088db48e3345930e3c0c8cc2e21bc147be4438a5fa7d48a +size 51395437 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_228_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_228_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..db00064855b413b7b61c915f8705345762d1995e --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_228_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e73b4dbb49654d42915033c8a38f19e0ad2ec10e3d1d5d299b1b3d4f56c9e4d8 +size 51395437 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_229_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_229_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..955690a769fe4d8a6275637ddb36190dee4dcff6 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_229_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d6b02f298d043be99f848acaff1804d1e66b5d752ad4934436c33f8de599284 +size 51395437 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a24a270573811c203762281b3abdd36e85b86c66 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da1da9cf6c408e535713de45d02d4ab05f66f6aa07cb14329f988eec3b426c93 +size 51395362 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_230_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_230_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f007f94801c2c6b77ee97b40d7a925827073db24 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_230_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1afc53813df3968a734331a50cbc0ae94db6066037775d217d56835e0285ddb2 +size 51395501 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_231_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_231_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d308b4931668920160792e412269ec8a225c7a3d --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_231_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3f9b5c8244c6f94ad54be0c4394d1980d252d5f2828f94558ee0714631e8233 +size 51395501 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_232_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_232_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa063f90f203266e58e0ca36d289d112f248ae0d --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_232_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b200540d505ee2349101a120c07bdc93a34c3338021cd7f5c3c4f66fffa5a27 +size 51395373 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_233_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_233_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5bf8273b9ce7c631752f5c7a4fc9473c982ed939 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_233_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:106c93ea31ce4f07a1a3da3f2c836bae9cff0b025c56e10b94fda15b53afa59e +size 51395437 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_234_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_234_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d48dae73ffb6fbc309f7425310fdd3c3f396b8b3 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_234_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4bd2e4326f396767b03b787efb1bff1c036e4404bd6136933e32254e240b911 +size 51395437 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_235_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_235_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a57378f3330aa621a4cca97370683d924940fafb --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_235_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:654e0d1554e48e0d877efb9518c8bf2c42eb5f1d74a14c6b7bef4586a650593a +size 51395373 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_236_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_236_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0e57c67568a7df2d9b31d90ef0b2529a67328abe --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_236_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:198b5db7c15bd35c5bb86b9fe4a59d13bda28c560c511dca354f98170cabb47b +size 51395501 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_237_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_237_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c61c156299f9d65c91724baf86a290472e50de00 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_237_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e466e3a5c88dc80f9573f93e2671c03b8efc97ff9cbf4f5a39ff2cdb2c014927 +size 51395373 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_238_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_238_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c099269835f6bfa735b7e1d5158f8b1420adff9b --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_238_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93ea8bcb02d3b16ad967a56417493f01a99af125bd0635938171d0e8b332b611 +size 51395437 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_239_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_239_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..845f6b47fc64a473a512f840766a926c19197e21 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_239_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58c81cc019a4e5f8e6787fd8486bbed099d9453b00d31e0819a6b44e807f6447 +size 51395501 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ac562e6a57bfaecef1e4f4ce1c24736b196444f1 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee45b3e616631fd8e29ab536082f81597273c11e42c16be5c0df31c24b8f68f7 +size 51395426 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_240_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_240_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d02297f2500a763f82b9a2a2452d57f4d4a139c --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_240_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de5bcdd41e8972fb922fae9a5675a31391389b9f8d842bbfde12e53da4d2b29e +size 51395501 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_241_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_241_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f17edb236e89fb002cbed1698c1dfd2d75a89854 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_241_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b341efcdd46bcda5ddfb5192cc14000f7f195884a9b218404cb88bbd01b6a713 +size 51395437 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_242_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_242_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..34897d4d7bf736c0f97195f933ca0e4d3069d3a3 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_242_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0691bdcc257830639766e8bb85f61fd860a3a59911b764020974657f950faad8 +size 51395373 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_243_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_243_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb49ff0a1384af95f252cfa1179e3f8812d8205b --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_243_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f1223347dd14931a3ccbcfbcc711e9cd88269f180f56971d6bdfc393217cc03 +size 51395437 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_244_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_244_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..412dbee1568e97b66f8e31dcdaf09bf1d45b7fc9 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_244_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f41a054ac0874b0c949b068559570a51c1aa414fd5c5de1bd554056bc78f55bf +size 51395501 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_245_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_245_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..353b12907c70ec099086d86605cdcf6389dfba83 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_245_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c3a004e3c45e3c7ed157439fea392bbdc32412388b637f3c51e0e6b7795da68 +size 51395437 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_246_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_246_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c8a07a6aa41fdf284f09e406788f816f398c06d --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_246_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e022f395dba2097fa2f9f537e91250e3b3d8285ec3139ba0563a5b0cad5b9be8 +size 51395437 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_247_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_247_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..53d0c2e52e24aa5e9af1ef4523ed1c33d45aa774 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_247_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74106628138ed06d44e4a9ccc6da577e88a89079f85d7ce49247df0509373074 +size 51395373 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_248_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_248_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c718cd9875c040611768d308e64a99ca5b3bae8 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_248_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a38bb61ca07f9eb10b4cdf6f2f30a9629ded4a58f036c131be4a7c5217e45ac +size 51395501 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_249_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_249_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c2991f676f7389262a0d1602e388bd1cc5bd4e7c --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_249_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5477eab3fce047a3d5775fa98377e118efba13e769bbada0f24e50fb7ebcca58 +size 51395565 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..58a590c64494d2e00a920a25254f7fe397f5a4fe --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40c7a23fc4e4304efa0efff2695dc871853aca62c790c63868ffbaeb3aaeff03 +size 51395490 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_250_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_250_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..02b4b37e43c52bd63b4ed358312e94aa778fd1b9 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_250_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a7e5f39903f509477f7c6d6f790d2b9b33c033169c08052f7e0fecbbc3a67e9 +size 51395501 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_251_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_251_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..631d808c3b0560dc7842e169ebbd56ba7093203b --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_251_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa3156b5bced6d82b0b873741ffda013228a1165cc119b9037c99905a84258f7 +size 51395373 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_252_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_252_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ff105796ec095b09c0418b87cd8dd69a0ebcedb --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_252_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6590ba15c9793cee41b22f0fdfb889a57c44cf1a1ef58f49e0971e28307a56f +size 51395373 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_253_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_253_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a81a6108b068a9b8bad0021734ad0dd659a0fa2a --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_253_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e400447db06e981f6d7a1ae2c4caa701a90ef505eb64d6a2db01405b97a57f9e +size 51395373 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_254_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_254_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a55378b0980a907f7fc35c7745ece03a5ddb7b8a --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_254_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35a7261667b1d100d32afc10bd374692e83d5983597bed34ec424c298409c892 +size 51395373 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_255_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_255_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..788e36743033a92b56f261b7a7ecfee13bcd40c4 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_255_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ce0ea7b1943a295879999061bb0c87ab45281bec1bd2af089020222405123de +size 51395373 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c82f9d3ae182b272a997214237d0206c5aa51dd --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b4e67c4fbf3124bc083b2eaefea7cf946dbdfa556b13641c74d0827d294283b +size 51395490 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9d215b017d2630c72f3138014ca9f0eb66c83c50 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:317dc2808b0514ed9ef20d4071dd9e68f4d3cf928f670e721526fa6361a0ed19 +size 51395362 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f843698583c5d8ce128e971d8b9e1999cf510fb --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bdcbd7d1116e69e6754b789b19e3b31e708c67c3d78775f011e3d0c47be7a70d +size 51395362 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a6875f458b09277f9279721b6fb5348ed7dc5962 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b96e7dc49947d59005dddfdc33c3c6d577d4cef6ec21eb825f6a5d17be1f5c38 +size 51395426 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1481832e7bff279f06277253f30151797e8fec40 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2827ad79dea914769daebb239684d03f0a87b5690cd981c3f0dfb5370fd1a7f +size 51395426 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..500d762ea409ed70c3ff14baca692cffa17ef622 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2fa599867cedac105592a62436b027689bb0a2445510e4080d356b70651b56e +size 51395351 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c887719f090076c199e31cb6f1ae716770bb59b --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ff39fbf2d2d89f2d0e7ed566c55749572f67368dc53f40eea7bd156f4021c78 +size 51395554 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..707a7df707e6dc3073bb49d307dc0d496b2831e6 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fdde174cd8300508682f1fe793f13916fae67832afa9205953c31cbcca756b52 +size 51395362 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4af417901a55acfbe222b1107027a916fe35f449 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c8f618b57ac36caff33b0dba277fe9ceb42679948fcf257766a17dd19bace1f +size 51395362 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c237d53ecfb7a6d71bc663e331930cbafbd5010 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5a12b01d9a6166a308514ab610ed30f2006774a6d35f586c154b6554e768fa7 +size 51395490 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..23afc0d50f73e58697d05b5a242d0542a322f339 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42287ce232a8c8a8808a4b1c9cd205ebfb09e633e23a1cc87481fc22a10e333a +size 51395426 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fcfac87817536155d0025aee4202ae79f58eec2b --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6657c736b2b206c88569fc155256d7d132848f170fd2dd00f8f5c25aa1c9ea0 +size 51395426 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ff5e3974c4d2fac9d73e20aff4ae6ed04b535e4f --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9c2306204ee93645d4c56f02c523fe1a26ceabd4fb8186ea2169746d178c859 +size 51395362 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..613e940b12690d488c7f4f5807208e971dccf875 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2f5ef83b6704b186d1f402b0d0b40f651c2fe65b72dfbcb85c14d490e7e076a +size 51395362 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c5578b98fa4cb4634485f3769b4bae89eb4c46f --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65529d3aadeb1b5bb22dc2cb6b43a8a47733958016e3ff9ec8964fda4d02f088 +size 51395490 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f5050910752adba219ba9abe96e8a126e40a4c0c --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa318555fbb93aeeb35ec672e4f22956e0e733bc2bf71ddbe2036122aacfcf40 +size 51395554 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..247a6ea365ec5fd4c3508ee3514524c48898abbd --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7be1ada48ed46f1b65983287ccb2ba0865f0346f07c11dfab4385445cb72872 +size 51395415 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c5d7f6e6b2ce455f8a5e083d6c6cc2f360f04c69 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f08d036e1b8e32f7e52bacdf24139c1268a9bfd74696b8d7b29bcfb463225ebd +size 51395426 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ba23c56f09cc526b4627c7cc38d407eb265ce81 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc468ca646797e75e81b3d0869ddacfef517cb4f14eec774fb72a449c9c7ae6d +size 51395426 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..416616514538e71c5408ea9eb8d189cd4580c764 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:333b8d4d6acf12aa53decb89c356dccda769739ec12d44a341b7409e53834915 +size 51395426 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..997bd9ff6588eb2d6b6471294f7d303279af404d --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b442e2906da1746f6e82953a8e31c5bc289ff2dea4859a60178f7ff269e97a5d +size 51395426 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..784e639479ec427515a71116c7d76b9ff4111ba6 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43a8f7eca1a9b4867628f0a72bc5657e80400caabba4e56192b1b9bcf38f12b7 +size 51395490 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f6ea86c01b4c280245a0a966fad7f1c92b4d9e73 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5631da54cea24a6e8977b0c1b3ce9be9044e4c9af9fc6009ce7038fd484628d5 +size 51395490 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..79442a14db9da3d8a7ce3e2997ba556250313880 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc9dc224cb7a7588434b1dd27f6260e7674e344c4241766c28c5b877d585dac7 +size 51395426 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba63230f5d2bb3a1502de35fcb713b7c29d8d7b6 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22009d8402eafe55670d0d927e7c7aa4a3fe1b790292d0dbe4620faef96ce7a6 +size 51395362 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a141bd9466fce3b9988183c140a92333d68f805 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34541d35bdeec2896779a951e2ccc9af28f7197f1943ba90cd2447d016f2fdfe +size 51395426 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7b81633cdba86c281aeb2134d38faea151cc4694 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1fbf04d384d34b76781670bfeacb727851d6d8820e02e2847f3f68f00ab9c64c +size 51395490 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c18b5352d3be860dd4c08a815329ec8e44c2aef --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:480cc1e4be1fa65e920768c459c2b3c8390642a03d9ed751e06724483b97d33c +size 51395415 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3dd4b763ee8ad7765e7d1aec993774c2fad2b20c --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75e4f84dd700089b7a49d61e5272e5b3b8246ef13e6b8efdb294e68a6f29e8a8 +size 51395426 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc3f1110c8a7404264ece7dfe91a3374bcabe0f8 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0192123dc5e4d53ead2e11c5d29bcf4053dc7086b65a89f336178355811d866 +size 51395426 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c44a931b440fddcec009563c89097ef8c208b2c --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1eaafd42ccaa1325ae4c65e1b370f4d229860dc55238060f325c32891f7a8a6 +size 51395490 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e0f62260c2a8355cb102dcbafc73bddeaf0ecae --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce0b4b0ff84c99d786f9d2e8d2532fe89d96db60030c9f3c2d0d2be8751f3fa2 +size 51395426 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..48398ce6b353cea19805ab87129d0e6e35a31dff --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b476184e7d6678f3298eb95ad059009c5d40de6a3e59be74a1add3117b7a97bc +size 51395426 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6afa0852af252791dc3b5794e65126d2a023ad3e --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df92e907fb732f0fe69e8f2958a8b2571a7734418b0045c88355bc52fa7eb1d5 +size 51395362 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..00f8177f862d229de80b5e33f19c4593d8d835c0 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69f76af28fb8ca8f145c7e88c84fd0e6a2ef819e2f44342da51fb2455e78632c +size 51395362 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b1a7293def1aeafe3b4d0a8aba80ffdab6783fe --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5d6457ca78855b2275f102cb99ce937cabb456e141e48ca01d5595ad233d8b7 +size 51395426 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a8793b7719c1ffa1f443ee98785b91a2ce6ca90b --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13b78f5babcd17ec1e3e15c7aed0513326f00751fa09de02c173537d20324add +size 51395490 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d725320ea264e8b027f437d3bba222acc5e4241 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb4dfa80c59779cb5fc896bf5a21135a06c42ced9ba68e88ee863ca2b2f678f7 +size 51395426 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..32b02ee9845abb7d458dbb4b249823a5a6e24d97 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b1bc5597b3649c1dd15773ca3c1619998fba02ab0ee404c31a3b9fa50966948 +size 51395415 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..57188140df4ef13f7612781d96d86eff7ae67fa7 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d71b4f246bcee3bb65d690cbae02e39764015a0a801e8ba4bd58e309f9ac760 +size 51395426 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2fca1a027eab377ddf641cec02791216a95d625d --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:039c1101aa4965172365c497341e412aa6859912d191a621663555b76e321c28 +size 51395362 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a746243a477588ca8f9508dd218495a01cecf815 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9a8c4aa96b89b5df2300138fb9065024507d27824cd98f36e849635830bd247 +size 51395490 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b5040c5b4139742b18df47b6eefa44c608e00de0 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90b44e06250f49cdbadc13f6cce8af6cc9a171bec5edd9a64153edb8b31316d0 +size 51395490 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ed03f957e6cc5d8ee934deaaf0c5bb6e0df3112 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94ea3072c330211769927b389ae69802c087290d69b480c735de3e18b70f0992 +size 51395426 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..40797a0be6c8ca515fd6f4ba6e2d9046f9f8d91b --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06bf7624e8d87718637a2b867ab69d6b989e6da2563fd026c9a85485f68bb886 +size 51395362 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..955bfbf6cd16a688bac7a6da9d3a7672018bb970 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fcd16e7c6151d21847f10c89189c422f8c8511c9f56dce6731e26314c28c6f63 +size 51395362 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..979236add1966b0feb295c89449dc49a7535adea --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e705cf2f8cdd2073fee67fcc436ecf9d7076e648726baace9053a66131a1f67b +size 51395426 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..847b297a520b7c0dc6e5008c1c9557ef95a3f6d6 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7cc50a6994eda5b8eff26fc77dfc3db7c1b93daa96f9ee1b6b5a1483db3af0e5 +size 51395490 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f5131c94516cf2389b5a8f643df41f6986a80c1c --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6030df6e124dab53ad5860f2b1cd58d820dec4f738e577be68ab2abe9e29478 +size 51395426 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a409cd09b0f8a313d99bca87728cec6238ff033 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d39543634a11e124fa650110a2286dd46ceba6e9bbca1edab99ed10bc9554d90 +size 51395479 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e2c14342b6c85ca08f2b969f81bc9ba53e2fe21 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89c29cb3819a8fd1c1b9e551b34b428de4e29b8fc7f8131f694a2a09a3426fe0 +size 51395490 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e8b6106504e7eccaaaaaa3fec4b28ebb504977f7 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ae71495c95684f36a5bf13f33e034f9e04011c3d27b534f12ab09e9050facde +size 51395362 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..96a897a73181e7cef9d85c07b57280a987eb0f11 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80b86f35df20fdf3aafd69ec99de217e6941d424b396f62e18acd66e47968bae +size 51395426 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..89c1b9cafe6b4b0fd33101ae89fcb1a4631d5d5d --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20dfa3d6ca6bb7891172586b8c4586972563779e6571c5c1c5ec371583a2b818 +size 51395490 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ff5224424b7e851f49af4a68579b9c7c09bd2bc9 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6e7fa103c5f5b66d78892bb418d0fd6e55a083c7743960be5f1894c51a1ebff +size 51395426 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..777d0beffb4eb2f88ba724f56537bd9cef12aab5 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73cc48be0cce0d5837a3a0fb232e893312f1c4bbd9c83443e1e417cc8592c564 +size 51395426 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..51c88577c58803cab20fb191237409257c1c3680 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:609c40ba89cd40bba3e5ed7dfccf8310e870ac7b6a8972ab2523b188f3101f8d +size 51395426 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4290aba4492206c2d4f8fbc37b0f0d7a4d7171df --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd8068f7cfad8dd2e09497b8c700bce52f0dbd3072c0458fc28d4de45a6c5885 +size 51395426 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ac7d1166ce4ccea7036ed9951ca3399e928cb3f8 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbc81d28915eea5a253e5c8404e024d855aeb44abaa93cda73d0ce00615f6aac +size 51395426 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a3b0b14a01d3378b55ab06f2fd6955a79522ba6d --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0684521f32c84dc346a4032ee627ea75eac6aa90f79ca942c198a3a2c77031e0 +size 51395554 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..53c6f3d99d7a01fcf3c71c9a480d0db92d8b1be4 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc7d4cbbc1566ab68b6c2ddb42798bb9b190a51ac239b0b763ac7e556be48522 +size 51395351 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..90edc9e38564964d4b994a6eefd2ee24262027bc --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:044e9dc285f219c807b8fae9ace6fc5161e4dd59fde7605f532c8e12b35ec077 +size 51395426 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6347f1bae197e8a64bfb6169ac786601b69ab0f5 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96763951d3f42febeb7672a346fe9a626bd447c1bd454923c37e2f877796c5b7 +size 51395362 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a92281f4e94a77ea0a0e49442ce7e58a1dd43f60 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ec2a34625dd3052c1b82c7d0f110149f74df7a51d3baf2b566605ba2a217211 +size 51395490 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ce981d388391d00b5edcb5fbc4fac13274e459e --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d04c1e0792be705b4a1072c89f1bb6b04b69e01094becc6eefc8f171c024eb3 +size 51395490 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2907e3a4377deb62205ef000d40e4e0ad3a8f2ad --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50b478e6926bc2cbaa4a681f3af4ace16197d8de12004d9d8f8847545d2e5f6b +size 51395426 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..06c0c267dba9afe9e317ce95176b3b32c093ff7b --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89d88bd0c6c92c2bba2e915f6afb77332ca77c5cc8afd0a08025aea6c307c773 +size 51395362 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aec32ae14c42a76212ac827bd79792f2ea3378fe --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cdcbf1a6c67d8a5ba06142b57f90f915a3867a477ed11b235e410785ebf4df94 +size 51395426 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed9eb7c0096f8b5af8258dc7cff4b55c34f1cef7 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77c4541bd2ef21d9006f84a5bc0bb23b8158338c2521df240a8d3a216f3cd4c9 +size 51395426 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..80f4d740e4ed9ce15743608b479b610a734fee77 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:086ae545b4c5ad9a16e79541f07c847b28d379f54605f1adeb56b0c8bbdb917b +size 51395426 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..414832cbfbc1b5779ca6825e80b77d6f26aefac7 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6a67bf980294770adeaaa3ebcb01c4055480babc069beca9d97d8eb6f3bd4ed +size 51395490 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d598ab3aed92d65483536b93b20c44fc7c398253 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b08f15a1cbda6695e1d7eca18eac88a2de804be5505064f7e0882e70b5a8534c +size 51395351 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..064c1da926e6c5c5f10731a99fbc6499d505c28f --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e381133c25b284919d7eae0df1a55854eba54d1058a23b7763b700331bef2d2 +size 51395362 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e7f8358267e2212d1957bcc47b013885639092e --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39dba1dc5e5e336b70e30441fdedf35d00b544d61018dc00b9e46f3e7231a724 +size 51395426 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..416cc83c0a9d9b2eface1fcf5b913b93ce504615 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4744322dc2442263f3541b9976f0017633fb804e46b740d6c38f585149dc7100 +size 51395490 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4cd12c515f7b3f5b81016d235a2642e694c48cb4 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6d84114325fa44e0b943563b60c597f13739af82e01b0391ebdd36a0e648341 +size 51395426 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..732e42aecd47099a86aa30621ebaaf846edbf750 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5204af8b11a54ef182a1f5d258d512c7b879050a0f278830ed72a824907b576b +size 51395426 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f012c89d05e05f32b954dbc39efa9a488e2d229a --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6fe704871bcdd5652afb22c322bbe236c02cd560034e842584104dbdd2c53ce1 +size 51395362 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..63638e39e57e70638be35bab64cc8db469127c1f --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48489ed31cd07ffd45df0f106a087c0ba81df9e7ba1cc90906d448fd13d4f165 +size 51395426 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..963c91d3d76cdee9d709fedc28edc2a861b7688c --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a748c32a7981ac374406a1979730f9ba343ced342e78fe3fad010576e204be7d +size 51395490 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f6726a4d16a0db6eb5d59a6ee6ca96feebb5a58 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32ebd5ae18386936aec3c30af840de167d9d391fa2e28ecae2e334308c8d1732 +size 51395362 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d21ebf2edf26b40e6f1536a6bb8c7df907202ce --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3b175a6fefff669cfe36a0aedd9d8f223074a484e22d70ded5e37a0ecbdd7de +size 51395426 diff --git a/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba41db38dd9b4e29156e99ce07b7ad5f03c3c457 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abcbfc5ddd4fac4b702c316bc2b8770d029a7648c4c6923169110088be220ab8 +size 51395479 diff --git a/1b121b21bc4seed2/global_step39672/layer_01-model_00-model_states.pt b/1b121b21bc4seed2/global_step39672/layer_01-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4dcad324f00eebd40ca931f68d013199de12cdf1 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/layer_01-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f7465f9e88ba2c9a45b1fb4bfed92e9de062635d15493a75bedc7646ee24f48 +size 187630851 diff --git a/1b121b21bc4seed2/global_step39672/layer_03-model_00-model_states.pt b/1b121b21bc4seed2/global_step39672/layer_03-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f78f7bc8843c6a4d744a703d4778b040f783fb6a --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/layer_03-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eeb87adb6535cf780f7c3f518062677a5c1a657779e76dfccfd23fb347bf4d9c +size 77121283 diff --git a/1b121b21bc4seed2/global_step39672/layer_04-model_00-model_states.pt b/1b121b21bc4seed2/global_step39672/layer_04-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e2ca6402e7b7cca2f8e3d16e7267feeda2efd0ad --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/layer_04-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7e2da42a7145e7415327248c9fb9bb8179c01ab1794de26330a0a9981b55020 +size 77121283 diff --git a/1b121b21bc4seed2/global_step39672/layer_05-model_00-model_states.pt b/1b121b21bc4seed2/global_step39672/layer_05-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..71e585b9191a267792961a3737ceff8f64e97d26 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/layer_05-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a32e47909e192949f5c30305a50b13081ab13c99056133c5ee4727c919d9cbca +size 77121283 diff --git a/1b121b21bc4seed2/global_step39672/layer_06-model_00-model_states.pt b/1b121b21bc4seed2/global_step39672/layer_06-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f596c66270b3f1596aafac983dfd9d0d4c65550 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/layer_06-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d2d461a1c15b5838397863f8370a18c3ad3742910a9fdd6d37ad38645214af2 +size 77121283 diff --git a/1b121b21bc4seed2/global_step39672/layer_07-model_00-model_states.pt b/1b121b21bc4seed2/global_step39672/layer_07-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c37a24ab5ea534c4915597499be8561d1d4637ba --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/layer_07-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e647379ab5056270f67dfefd2f5fef22288c54c64fce9b6a3eb2226e1f290e67 +size 77121283 diff --git a/1b121b21bc4seed2/global_step39672/layer_08-model_00-model_states.pt b/1b121b21bc4seed2/global_step39672/layer_08-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9bc6ed5545b303e09555cb45919d8541a90970c5 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/layer_08-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc594122877f08c80476837b1782745cd90fcd4b3b972a57900b2ac71d30a4c8 +size 77121283 diff --git a/1b121b21bc4seed2/global_step39672/layer_09-model_00-model_states.pt b/1b121b21bc4seed2/global_step39672/layer_09-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..205f4f69bac32042e36b23b2818a6417cba4c9af --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/layer_09-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9d1bf421257066e6ea29f288e800d4815f9115cc6ad2ac5faa20b5545fcc677 +size 77121283 diff --git a/1b121b21bc4seed2/global_step39672/layer_10-model_00-model_states.pt b/1b121b21bc4seed2/global_step39672/layer_10-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c5fc700f1aa03af724ee2722a7620216cc70539 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/layer_10-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4c6309a16decbd28561001b06cad1702a8efd7391f24a103aa14edd9bb770e4 +size 77121283 diff --git a/1b121b21bc4seed2/global_step39672/layer_11-model_00-model_states.pt b/1b121b21bc4seed2/global_step39672/layer_11-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5718ba24e3bec6fba76a9cef73f093afab0ec97e --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/layer_11-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73be103c7d3bdf53ceb75d509d0b6b5d6341740235b056c8e2fb1ef12cce5911 +size 77121283 diff --git a/1b121b21bc4seed2/global_step39672/layer_12-model_00-model_states.pt b/1b121b21bc4seed2/global_step39672/layer_12-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b79275acb1990c970919e7d262c92cab859f6197 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/layer_12-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b52880d5dede95c7256d0d17f735addfae3a830d14440812f35cd5fed47b50e3 +size 77121283 diff --git a/1b121b21bc4seed2/global_step39672/layer_13-model_00-model_states.pt b/1b121b21bc4seed2/global_step39672/layer_13-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..06215e863764947efeee0d13db24eb1de423d27e --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/layer_13-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7e276857d14373e9195deda77e95706924783041f4981f301fd950943af8e28 +size 77121283 diff --git a/1b121b21bc4seed2/global_step39672/layer_14-model_00-model_states.pt b/1b121b21bc4seed2/global_step39672/layer_14-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..278114a13a99d26c3bdafdb60ec02aaeed2b178e --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/layer_14-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7462b79470adae6a1d6b227aaffccb3c7f82c2d2c107a4debe5ecd430a2e71e1 +size 77121283 diff --git a/1b121b21bc4seed2/global_step39672/layer_15-model_00-model_states.pt b/1b121b21bc4seed2/global_step39672/layer_15-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..16701b707c53b80d9762fc2fb48630507b46bf09 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/layer_15-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d378f2487973bbb96cb395a9534219dea90070f4623908b3e65fa94280df270f +size 77121283 diff --git a/1b121b21bc4seed2/global_step39672/layer_16-model_00-model_states.pt b/1b121b21bc4seed2/global_step39672/layer_16-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..51fd675601a9a0ca5820a7ff20205a499005aea7 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/layer_16-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ebf5dcc9395316d7f7c556720f34e8e60ce9590e17b510c6a11eb56698a5eec +size 77121283 diff --git a/1b121b21bc4seed2/global_step39672/layer_17-model_00-model_states.pt b/1b121b21bc4seed2/global_step39672/layer_17-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4edcdb97c1828630540b2a74fcbd0268aa565959 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/layer_17-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e65093ce766ea38e736301d767a775d34b4e84672ba965482671259f742f37c9 +size 77121283 diff --git a/1b121b21bc4seed2/global_step39672/layer_18-model_00-model_states.pt b/1b121b21bc4seed2/global_step39672/layer_18-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..96693bbcb860d4f9b308520bac1221a824c199ce --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/layer_18-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b717649d8c2d3e4d07587bc4df804954c9692a84acc2fce56afa053578b2e9a2 +size 77121283 diff --git a/1b121b21bc4seed2/global_step39672/layer_19-model_00-model_states.pt b/1b121b21bc4seed2/global_step39672/layer_19-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0fbf2c94be8c8c9e0ecc2d64f5a556dd67f0504a --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/layer_19-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15c47726f2dd1e6e0f1b2f69c6581f9a76e2f1ebc8590d9dbf49495aca22f1f3 +size 77121283 diff --git a/1b121b21bc4seed2/global_step39672/layer_20-model_00-model_states.pt b/1b121b21bc4seed2/global_step39672/layer_20-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8aa79573bad9fa3f098d6d9b465f8e0eb2e8b914 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/layer_20-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9477c7d89aea1a79015d47db2d3be68d897f16fc20b1898748240a39142a7e33 +size 77121283 diff --git a/1b121b21bc4seed2/global_step39672/layer_21-model_00-model_states.pt b/1b121b21bc4seed2/global_step39672/layer_21-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c9024298e4f35fd7543f3ecffcb422226989373 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/layer_21-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:833432bc0bf0b5ea14b935775eb7c4b5505c6fc6618853dc209e4e99ebde0636 +size 77121283 diff --git a/1b121b21bc4seed2/global_step39672/layer_22-model_00-model_states.pt b/1b121b21bc4seed2/global_step39672/layer_22-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e50ffe16ee9c41c92debfa73d85d7164fd24398 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/layer_22-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d3727b925bf1d12a4af386171785cac496b7ded854be1e82e182c2f118282e8 +size 77121283 diff --git a/1b121b21bc4seed2/global_step39672/layer_23-model_00-model_states.pt b/1b121b21bc4seed2/global_step39672/layer_23-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f9cb08985d4d3a7c85a0b654581850788d34cf94 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/layer_23-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7237816b2b9a30cb8ccef0ff0a63a3c72206dd412c827c9c06fa6fab57673cad +size 77121283 diff --git a/1b121b21bc4seed2/global_step39672/layer_24-model_00-model_states.pt b/1b121b21bc4seed2/global_step39672/layer_24-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd91f020930226312adb2768600a6dc0add4db12 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/layer_24-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d48cde83102ccce5cb98679ad2aa826ac7b30078fc7813ce2a573b8804a3e529 +size 77121283 diff --git a/1b121b21bc4seed2/global_step39672/layer_25-model_00-model_states.pt b/1b121b21bc4seed2/global_step39672/layer_25-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1548fdaf57645b17124d31b56597735f33f587b --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/layer_25-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3ceddf5030cc7c22a28ac2e6de583510ad78728bff6cd69149ec82c0729f638 +size 77121283 diff --git a/1b121b21bc4seed2/global_step39672/layer_26-model_00-model_states.pt b/1b121b21bc4seed2/global_step39672/layer_26-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..027f1fd9e966561f66edddb10d301232c8b80367 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/layer_26-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5926bbaa40c949693eba0ce5f575711dbd928faeecf632f0a466d11ce52a8153 +size 77121283 diff --git a/1b121b21bc4seed2/global_step39672/layer_27-model_00-model_states.pt b/1b121b21bc4seed2/global_step39672/layer_27-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..599d03485321e96b88b62e40e11415a83edd8b12 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/layer_27-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d753ec638c861ae9c840b0e0bc8d780bae3e388efa403f15278f44f6f1992eea +size 77121283 diff --git a/1b121b21bc4seed2/global_step39672/layer_28-model_00-model_states.pt b/1b121b21bc4seed2/global_step39672/layer_28-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..960c315fdf0c031c21d833fd2d524ab79905b9b9 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/layer_28-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c101e1861eb4c4e6a46fe43766c06064479b91ed24ba8bd6008c81d35850c368 +size 77121283 diff --git a/1b121b21bc4seed2/global_step39672/layer_30-model_00-model_states.pt b/1b121b21bc4seed2/global_step39672/layer_30-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..92968f2f9e51a3e48654b049df8406f67ab8b8b0 --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/layer_30-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c83c8d1b98e4b8c4399013435957e619719127061e072a192115a91b2de3f91 +size 8387 diff --git a/1b121b21bc4seed2/global_step39672/mp_rank_00_model_states.pt b/1b121b21bc4seed2/global_step39672/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ccdcbf947069bb72e62423c31e636ad888d098b --- /dev/null +++ b/1b121b21bc4seed2/global_step39672/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08181c96249f2f008d93dd633333bc103965f5eafbe3a8cd1da514ca87b0d214 +size 43827 diff --git a/1b121b21bc4seed2/transformers/config.json b/1b121b21bc4seed2/transformers/config.json new file mode 100644 index 0000000000000000000000000000000000000000..7120acb75187622c061f0425674b658dd9155502 --- /dev/null +++ b/1b121b21bc4seed2/transformers/config.json @@ -0,0 +1 @@ +{"vocab_size": 50304, "n_positions": 2048, "n_embd": 1792, "n_layer": 26, "n_head": 14, "n_inner": 7168, "activation_function": "gelu", "resid_pdrop": 0.1, "embd_pdrop": 0.1, "attn_pdrop": 0.1, "layer_norm_epsilon": 1e-05, "initializer_range": 0.02, "summary_type": "cls_index", "summary_use_proj": true, "summary_activation": null, "summary_first_dropout": 0.1, "summary_proj_to_labels": true, "scale_attn_weights": true, "use_cache": true, "scale_attn_by_inverse_layer_idx": false, "reorder_and_upcast_attn": false, "bos_token_id": 50256, "eos_token_id": 50256, "return_dict": true, "output_hidden_states": false, "output_attentions": false, "torchscript": false, "torch_dtype": null, "use_bfloat16": false, "tf_legacy_loss": false, "pruned_heads": {}, "tie_word_embeddings": true, "is_encoder_decoder": false, "is_decoder": false, "cross_attention_hidden_size": null, "add_cross_attention": false, "tie_encoder_decoder": false, "max_length": 20, "min_length": 0, "do_sample": false, "early_stopping": false, "num_beams": 1, "num_beam_groups": 1, "diversity_penalty": 0.0, "temperature": 1.0, "top_k": 50, "top_p": 1.0, "typical_p": 1.0, "repetition_penalty": 1.0, "length_penalty": 1.0, "no_repeat_ngram_size": 0, "encoder_no_repeat_ngram_size": 0, "bad_words_ids": null, "num_return_sequences": 1, "chunk_size_feed_forward": 0, "output_scores": false, "return_dict_in_generate": false, "forced_bos_token_id": null, "forced_eos_token_id": null, "remove_invalid_values": false, "exponential_decay_length_penalty": null, "suppress_tokens": null, "begin_suppress_tokens": null, "architectures": ["GPT2LMHeadModel"], "finetuning_task": null, "id2label": {"0": "LABEL_0", "1": "LABEL_1"}, "label2id": {"LABEL_0": 0, "LABEL_1": 1}, "tokenizer_class": null, "prefix": null, "pad_token_id": null, "sep_token_id": null, "decoder_start_token_id": null, "task_specific_params": null, "problem_type": null, "_name_or_path": "", "transformers_version": "4.25.0.dev0", "n_ctx": 1024, "gradient_checkpointing": false, "model_type": "gpt2"} \ No newline at end of file diff --git a/1b121b21bc4seed2/transformers/pytorch_model.bin b/1b121b21bc4seed2/transformers/pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..ee70ea40f299a5f7b528b2c90e21a2bce70a95b0 --- /dev/null +++ b/1b121b21bc4seed2/transformers/pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:326f1bcc033b1d4e29f6c9ec439bd918efe569d48d24428a4a407be770b0612e +size 2410895501 diff --git a/1b121b21bc4seed3/evaluation/generation/examples.1b121b21bc4seed3_GEM-web_nlg_en_PALM_prompt_0.jsonl b/1b121b21bc4seed3/evaluation/generation/examples.1b121b21bc4seed3_GEM-web_nlg_en_PALM_prompt_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/1b121b21bc4seed3/evaluation/generation/examples.1b121b21bc4seed3_GEM-web_nlg_en_PALM_prompt_1.jsonl b/1b121b21bc4seed3/evaluation/generation/examples.1b121b21bc4seed3_GEM-web_nlg_en_PALM_prompt_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/1b121b21bc4seed3/evaluation/generation/examples.1b121b21bc4seed3_GEM-web_nlg_en_PALM_prompt_2.jsonl b/1b121b21bc4seed3/evaluation/generation/examples.1b121b21bc4seed3_GEM-web_nlg_en_PALM_prompt_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/1b121b21bc4seed3/evaluation/generation/examples.1b121b21bc4seed3_GEM-web_nlg_en_PALM_prompt_3.jsonl b/1b121b21bc4seed3/evaluation/generation/examples.1b121b21bc4seed3_GEM-web_nlg_en_PALM_prompt_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/1b121b21bc4seed3/evaluation/generation/examples.1b121b21bc4seed3_GEM-web_nlg_en_PALM_prompt_4.jsonl b/1b121b21bc4seed3/evaluation/generation/examples.1b121b21bc4seed3_GEM-web_nlg_en_PALM_prompt_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/1b121b21bc4seed3/evaluation/generation/examples.1b121b21bc4seed3_GEM-web_nlg_en_PALM_prompt_5.jsonl b/1b121b21bc4seed3/evaluation/generation/examples.1b121b21bc4seed3_GEM-web_nlg_en_PALM_prompt_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/1b121b21bc4seed3/evaluation/generation/examples.1b121b21bc4seed3_GEM-wiki_lingua_en_tldr_en_0.jsonl b/1b121b21bc4seed3/evaluation/generation/examples.1b121b21bc4seed3_GEM-wiki_lingua_en_tldr_en_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/1b121b21bc4seed3/evaluation/generation/examples.1b121b21bc4seed3_GEM-wiki_lingua_en_tldr_en_1.jsonl b/1b121b21bc4seed3/evaluation/generation/examples.1b121b21bc4seed3_GEM-wiki_lingua_en_tldr_en_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/1b121b21bc4seed3/evaluation/generation/examples.1b121b21bc4seed3_GEM-wiki_lingua_en_tldr_en_2.jsonl b/1b121b21bc4seed3/evaluation/generation/examples.1b121b21bc4seed3_GEM-wiki_lingua_en_tldr_en_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/1b121b21bc4seed3/evaluation/generation/examples.1b121b21bc4seed3_GEM-wiki_lingua_en_tldr_en_3.jsonl b/1b121b21bc4seed3/evaluation/generation/examples.1b121b21bc4seed3_GEM-wiki_lingua_en_tldr_en_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/1b121b21bc4seed3/evaluation/generation/examples.1b121b21bc4seed3_GEM-wiki_lingua_en_tldr_en_4.jsonl b/1b121b21bc4seed3/evaluation/generation/examples.1b121b21bc4seed3_GEM-wiki_lingua_en_tldr_en_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/1b121b21bc4seed3/evaluation/generation/examples.1b121b21bc4seed3_GEM-wiki_lingua_en_tldr_en_5.jsonl b/1b121b21bc4seed3/evaluation/generation/examples.1b121b21bc4seed3_GEM-wiki_lingua_en_tldr_en_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/1b121b21bc4seed3/evaluation/generation/examples.1b121b21bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl b/1b121b21bc4seed3/evaluation/generation/examples.1b121b21bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/1b121b21bc4seed3/evaluation/generation/examples.1b121b21bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl b/1b121b21bc4seed3/evaluation/generation/examples.1b121b21bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/1b121b21bc4seed3/evaluation/generation/examples.1b121b21bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl b/1b121b21bc4seed3/evaluation/generation/examples.1b121b21bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/1b121b21bc4seed3/evaluation/generation/examples.1b121b21bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl b/1b121b21bc4seed3/evaluation/generation/examples.1b121b21bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/1b121b21bc4seed3/evaluation/generation/examples.1b121b21bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl b/1b121b21bc4seed3/evaluation/generation/examples.1b121b21bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/1b121b21bc4seed3/evaluation/generation/examples.1b121b21bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl b/1b121b21bc4seed3/evaluation/generation/examples.1b121b21bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/1b121b21bc4seed3/evaluation/generation/examples.1b121b21bc4seed3_gem_xsum_article_DOC_summary_0.jsonl b/1b121b21bc4seed3/evaluation/generation/examples.1b121b21bc4seed3_gem_xsum_article_DOC_summary_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/1b121b21bc4seed3/evaluation/generation/examples.1b121b21bc4seed3_gem_xsum_article_DOC_summary_1.jsonl b/1b121b21bc4seed3/evaluation/generation/examples.1b121b21bc4seed3_gem_xsum_article_DOC_summary_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/1b121b21bc4seed3/evaluation/generation/examples.1b121b21bc4seed3_gem_xsum_article_DOC_summary_2.jsonl b/1b121b21bc4seed3/evaluation/generation/examples.1b121b21bc4seed3_gem_xsum_article_DOC_summary_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/1b121b21bc4seed3/evaluation/generation/examples.1b121b21bc4seed3_gem_xsum_article_DOC_summary_3.jsonl b/1b121b21bc4seed3/evaluation/generation/examples.1b121b21bc4seed3_gem_xsum_article_DOC_summary_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/1b121b21bc4seed3/evaluation/generation/examples.1b121b21bc4seed3_gem_xsum_article_DOC_summary_4.jsonl b/1b121b21bc4seed3/evaluation/generation/examples.1b121b21bc4seed3_gem_xsum_article_DOC_summary_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/1b121b21bc4seed3/evaluation/generation/examples.1b121b21bc4seed3_gem_xsum_article_DOC_summary_5.jsonl b/1b121b21bc4seed3/evaluation/generation/examples.1b121b21bc4seed3_gem_xsum_article_DOC_summary_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/1b121b21bc4seed3/evaluation/generation/merged.csv b/1b121b21bc4seed3/evaluation/generation/merged.csv new file mode 100644 index 0000000000000000000000000000000000000000..8d4ad2a8389c889b720cdeadb760a63ce6875229 --- /dev/null +++ b/1b121b21bc4seed3/evaluation/generation/merged.csv @@ -0,0 +1 @@ +dataset,fewshots,prompt,metric,value diff --git a/1b121b21bc4seed3/evaluation/generation/merged.json b/1b121b21bc4seed3/evaluation/generation/merged.json new file mode 100644 index 0000000000000000000000000000000000000000..9e26dfeeb6e641a33dae4961196235bdb965b21b --- /dev/null +++ b/1b121b21bc4seed3/evaluation/generation/merged.json @@ -0,0 +1 @@ +{} \ No newline at end of file diff --git a/1b121b21bc4seed4/evaluation/generation/agg.1b121b21bc4seed4_GEM-web_nlg_en_PALM_prompt_0.json b/1b121b21bc4seed4/evaluation/generation/agg.1b121b21bc4seed4_GEM-web_nlg_en_PALM_prompt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..d2837d6a10508acb8c75defe045faba94a419ad9 --- /dev/null +++ b/1b121b21bc4seed4/evaluation/generation/agg.1b121b21bc4seed4_GEM-web_nlg_en_PALM_prompt_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.28572015895181313, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.029996683677028884}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.06275107464568752, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.001482626784800971}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.2653496514419625, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0044301076161033445}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.09566430048114055, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0019833726857373933}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03009186338419653, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0009122332803552036}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.1306746149712155, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003040441899500505}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.045926667677568665, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0012416071370673657}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.06029258655079738, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0013643648691810868}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.25861360612073325, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004336001927934783}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.09229607491866483, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0018548951773486634}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.0599952987639967, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0013920010929440471}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.25468022554337166, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.00416218635602354}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.0914984902210792, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0018580702167419888}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/1b121b21bc4seed4/evaluation/generation/agg.1b121b21bc4seed4_GEM-web_nlg_en_PALM_prompt_1.json b/1b121b21bc4seed4/evaluation/generation/agg.1b121b21bc4seed4_GEM-web_nlg_en_PALM_prompt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..dc6bb1d0215f29382614b4d1c8b2f49ece86b2e0 --- /dev/null +++ b/1b121b21bc4seed4/evaluation/generation/agg.1b121b21bc4seed4_GEM-web_nlg_en_PALM_prompt_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.2733809666843245, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.017469945535516233}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.06127827669468516, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0014475626789825216}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.2912358718895091, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0047559174768431}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.09465272634611742, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0018532707516154}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.028424762596691282, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0009872409719648724}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.13634361210693505, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0031518261028729865}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.043447331936707745, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0011595853852308454}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.05798019246549793, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0013348612234876421}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.2756227919098518, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004404790096916205}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.08967525096022803, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0017040144863156993}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.0584971868634523, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.001386020107167148}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.2763902169531308, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004392872739454734}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.09023227224081035, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0017566163632365401}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/1b121b21bc4seed4/evaluation/generation/agg.1b121b21bc4seed4_GEM-web_nlg_en_PALM_prompt_2.json b/1b121b21bc4seed4/evaluation/generation/agg.1b121b21bc4seed4_GEM-web_nlg_en_PALM_prompt_2.json new file mode 100644 index 0000000000000000000000000000000000000000..3d4a299b621e163578a34f971bea16ef2983dd03 --- /dev/null +++ b/1b121b21bc4seed4/evaluation/generation/agg.1b121b21bc4seed4_GEM-web_nlg_en_PALM_prompt_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.27692663560456576, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.020364718206970903}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.06147368851457221, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0012623013185335313}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.30263039971208694, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004760584060971739}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.09625717915221209, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.00174014878444931}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.028063334403907188, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007662392196332797}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.14354815751347613, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0032059165700188356}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.044005340063557, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0010837646169888715}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.05786141529156912, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0011333739480816865}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.286302289137813, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004385346387690765}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.0907708660179587, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0015736293804571027}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.058721463920226806, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0012062193203122612}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.287696314630283, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004428617061773817}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.09187344007508645, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016563753568251043}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/1b121b21bc4seed4/evaluation/generation/agg.1b121b21bc4seed4_GEM-web_nlg_en_PALM_prompt_3.json b/1b121b21bc4seed4/evaluation/generation/agg.1b121b21bc4seed4_GEM-web_nlg_en_PALM_prompt_3.json new file mode 100644 index 0000000000000000000000000000000000000000..11f9c03b430b9f5b08475f892960fee365b5aae4 --- /dev/null +++ b/1b121b21bc4seed4/evaluation/generation/agg.1b121b21bc4seed4_GEM-web_nlg_en_PALM_prompt_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.29659125910672235, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.016882600262624867}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.06145887932212597, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0012169314124561455}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.30505300258942414, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0047261670100499364}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.09650412351241988, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.00167247613646195}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.027901257259455022, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007085509669261345}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.14687843284043367, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0032247187337236904}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.04405862636243696, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0010210491782955636}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.05816779259264925, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001101022422405542}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.2897233872600757, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004365094346814999}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.09147131174467073, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0015248452457480056}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.058548171185912525, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0011357565151254563}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.2895152165474746, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004340778368401744}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.09190353821219928, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0015652081391078101}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/1b121b21bc4seed4/evaluation/generation/agg.1b121b21bc4seed4_GEM-web_nlg_en_PALM_prompt_4.json b/1b121b21bc4seed4/evaluation/generation/agg.1b121b21bc4seed4_GEM-web_nlg_en_PALM_prompt_4.json new file mode 100644 index 0000000000000000000000000000000000000000..e6ad487a1dd9a5010ffc0f1c2e12ee4403c520c5 --- /dev/null +++ b/1b121b21bc4seed4/evaluation/generation/agg.1b121b21bc4seed4_GEM-web_nlg_en_PALM_prompt_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.32349384025701167, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.021841302866309788}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.0625728361410853, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0012585041311395817}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.3094168818387454, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004729097260215436}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.09824537940970629, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0017168314347721003}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.028682921178866484, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007563993720637289}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.15044042342708142, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003333834053934159}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.0452158613394661, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0010697836859867177}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.059023081811736294, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0011089492079030946}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.29435917450238935, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0044243064370870335}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.09288695263220921, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0015312884011513372}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.05982186254258612, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0011713233210840226}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.2960727424843719, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004432691110581699}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.09395763356452147, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016024157843164731}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/1b121b21bc4seed4/evaluation/generation/agg.1b121b21bc4seed4_GEM-web_nlg_en_PALM_prompt_5.json b/1b121b21bc4seed4/evaluation/generation/agg.1b121b21bc4seed4_GEM-web_nlg_en_PALM_prompt_5.json new file mode 100644 index 0000000000000000000000000000000000000000..61cdfbf1fe2dc48cd0af0c07632f4ab931ba1d7b --- /dev/null +++ b/1b121b21bc4seed4/evaluation/generation/agg.1b121b21bc4seed4_GEM-web_nlg_en_PALM_prompt_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.3317247520236422, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.02438683801110983}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.06471426127247473, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0012898743879850927}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.3220301197483266, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004784458908262577}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.1015968420316754, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0017067334576059984}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.029766999027414025, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0008118603022394101}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.15682390612074046, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0033732274141397736}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.04683784475546268, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0010906780700661233}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.06064903145944483, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0011531567240369417}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.30378656882887267, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004419672235023449}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.09534760210410158, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001533464120564557}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.061657852757433344, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0012078523776645487}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.3073326718000021, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004475310017341517}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.0967982427270365, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0015966272469230514}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/1b121b21bc4seed4/evaluation/generation/agg.1b121b21bc4seed4_GEM-wiki_lingua_en_tldr_en_0.json b/1b121b21bc4seed4/evaluation/generation/agg.1b121b21bc4seed4_GEM-wiki_lingua_en_tldr_en_0.json new file mode 100644 index 0000000000000000000000000000000000000000..413c91cd624e79b4a7efb53536062453676d5e1b --- /dev/null +++ b/1b121b21bc4seed4/evaluation/generation/agg.1b121b21bc4seed4_GEM-wiki_lingua_en_tldr_en_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.13780680503285866, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.001963222074069445}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.2300113800580128, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0027523450735060214}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.15995178659481124, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0019476998067523457}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.027958971164094862, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007185096475725596}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.04802627198798666, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0012953632843939321}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.0325449603413564, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0007946537089430446}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.10894258616198119, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0014095848399899374}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.18869266341630972, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0022499271779208518}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.12806903787214233, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001432165288725186}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.12619303410814398, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0017830267623956222}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.2118167894154195, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0025399740287383532}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.14672463644520317, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0017705329316914052}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 1.4715584716266366, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.05979035173894537}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/1b121b21bc4seed4/evaluation/generation/agg.1b121b21bc4seed4_GEM-wiki_lingua_en_tldr_en_1.json b/1b121b21bc4seed4/evaluation/generation/agg.1b121b21bc4seed4_GEM-wiki_lingua_en_tldr_en_1.json new file mode 100644 index 0000000000000000000000000000000000000000..088ccda5a4ca3cf6b1acaf765714082d1af39199 --- /dev/null +++ b/1b121b21bc4seed4/evaluation/generation/agg.1b121b21bc4seed4_GEM-wiki_lingua_en_tldr_en_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.14303855949220973, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0017883259547811035}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.2404640566053214, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0025568167624806268}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.1659619521945487, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0017255813810933987}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.0247139355641883, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0006686054027706484}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.043281756890626494, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0012894489706408074}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.02872278229177072, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0007406492584205885}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.10120656325023195, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0011799928185521268}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.17663608162711542, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0019540696402957683}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.11865039810855227, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0011448070269801268}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.133863409884033, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0016645742544581718}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.22590717474478603, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0024041420866198616}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.15546750970375475, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016049368612675332}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 1.4105754686734944, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.05004327536852838}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/1b121b21bc4seed4/evaluation/generation/agg.1b121b21bc4seed4_GEM-wiki_lingua_en_tldr_en_2.json b/1b121b21bc4seed4/evaluation/generation/agg.1b121b21bc4seed4_GEM-wiki_lingua_en_tldr_en_2.json new file mode 100644 index 0000000000000000000000000000000000000000..bc2db3de079ecba57d7b03fbda26d443b950fdba --- /dev/null +++ b/1b121b21bc4seed4/evaluation/generation/agg.1b121b21bc4seed4_GEM-wiki_lingua_en_tldr_en_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.1405364837901601, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.001939748022665139}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.22575505407910562, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002550117228501278}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.1592319273466656, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.001799066929060303}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.025662875444857295, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007691462288959418}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.04175150895044056, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.001189901549490804}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.028841983524197482, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0007611631081205323}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.1083364462309822, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001405789374506379}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.17872732097294958, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.001999408312244932}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.12364040415407823, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0012736531821000415}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.13103000490181455, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0018143737843109569}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.2109444720461656, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0023822951303522515}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.14844491271068486, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016652808137804262}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 1.2900289618857925, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.04780794942619469}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/1b121b21bc4seed4/evaluation/generation/agg.1b121b21bc4seed4_GEM-wiki_lingua_en_tldr_en_3.json b/1b121b21bc4seed4/evaluation/generation/agg.1b121b21bc4seed4_GEM-wiki_lingua_en_tldr_en_3.json new file mode 100644 index 0000000000000000000000000000000000000000..ced0139ffa1011ff45521bee1ab0120e290a59da --- /dev/null +++ b/1b121b21bc4seed4/evaluation/generation/agg.1b121b21bc4seed4_GEM-wiki_lingua_en_tldr_en_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.12509614688619689, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002228795608935358}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.18767300213224564, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0028539387200514476}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.1342644995667986, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0019642297496972366}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.024250258441802567, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0009026138649276358}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.037597498222217, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0012860828030060772}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.025820231326483496, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0007752810347348394}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.0999116738568996, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0017693027578086957}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.15265267010514852, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0023328283894968257}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.1073751120661638, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.00149029795685705}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.11675484033349125, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.002089428868664697}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.17579490426422517, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.00269019117553292}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.12525446512455207, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.001822028086382638}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 1.4599914767802553, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.0635195569874681}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/1b121b21bc4seed4/evaluation/generation/agg.1b121b21bc4seed4_GEM-wiki_lingua_en_tldr_en_4.json b/1b121b21bc4seed4/evaluation/generation/agg.1b121b21bc4seed4_GEM-wiki_lingua_en_tldr_en_4.json new file mode 100644 index 0000000000000000000000000000000000000000..5867d63c7fd0100bc21d9a1a892545cc73826c17 --- /dev/null +++ b/1b121b21bc4seed4/evaluation/generation/agg.1b121b21bc4seed4_GEM-wiki_lingua_en_tldr_en_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.04485321962453146, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0017875667294004294}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.06630548480377385, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0024064841997783804}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.04622406565185966, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0016303591829101983}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.008654276655755648, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0005433398891243852}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.013973442151458024, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0008607910239468982}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.009339471992932759, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0005238484713453825}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.03703928516688903, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0014780279022334575}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.05553695501709392, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0020162336010684924}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.03817435899320631, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001315667296339476}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.04131778962417704, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0016612472366310286}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.061078533602158244, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0022269504871210042}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.04244591804424164, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0014960454994858057}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 0.3702833561251355, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.030351290737556852}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/1b121b21bc4seed4/evaluation/generation/agg.1b121b21bc4seed4_GEM-wiki_lingua_en_tldr_en_5.json b/1b121b21bc4seed4/evaluation/generation/agg.1b121b21bc4seed4_GEM-wiki_lingua_en_tldr_en_5.json new file mode 100644 index 0000000000000000000000000000000000000000..f9329fe4bb3c9767b6c20898c53c83b3cee2578c --- /dev/null +++ b/1b121b21bc4seed4/evaluation/generation/agg.1b121b21bc4seed4_GEM-wiki_lingua_en_tldr_en_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.007895152558976005, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.000844472965838446}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.011330805175563327, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0011068236259164767}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.007838938488476992, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0007592053204344529}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.001828752443277852, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0002833369118955633}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.002712234792676449, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.00040657012932559535}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.0017395393632540774, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.00022581320583642028}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.006451660866714186, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0006761070510151714}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.009434380372514109, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0009165354870618827}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.006459264593320741, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0006146390001712349}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.007220742560238168, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0007677030305742829}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.010470405484261038, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0010219886346664543}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.007176068947718324, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0006890108922026801}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 1.0605881261031538e-06, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 1.8732681876015495e-06}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/1b121b21bc4seed4/evaluation/generation/agg.1b121b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_0.json b/1b121b21bc4seed4/evaluation/generation/agg.1b121b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..9287405276eeba12c7f2bc91b0c8779547205d87 --- /dev/null +++ b/1b121b21bc4seed4/evaluation/generation/agg.1b121b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 1.0756224564831869, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.064362467364649}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.2588235923286985, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.004562924193018284}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.09771851611832182, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0018076944872090492}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.11475475475567845, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0016267727810947243}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.07095225790843339, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.004012167691904306}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.018594174934204018, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.000789200672023998}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.017364866430399792, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0006257195214464453}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.24270724404000282, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.004446165912080725}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.09270329159251155, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.001777052888516187}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.10751161947929294, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0015525911247785784}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.24212046048078248, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.004500843067139839}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.08721014170888262, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0015860867044055972}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.1043086079779956, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.001501216899123504}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/1b121b21bc4seed4/evaluation/generation/agg.1b121b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_1.json b/1b121b21bc4seed4/evaluation/generation/agg.1b121b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_1.json new file mode 100644 index 0000000000000000000000000000000000000000..d16ef93de1a14e90ba4dd7d1297033d089cb3d29 --- /dev/null +++ b/1b121b21bc4seed4/evaluation/generation/agg.1b121b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 5.6340703914383115, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.07802081757825902}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.3496844195497873, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0030957066657378565}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4061353589201485, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.003002747367144736}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.3364924250714533, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0019671670892094355}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.13845324209640059, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0019371833648373655}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.1632725866215026, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.001973962532025402}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.132388948988302, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0014487165943513271}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.2545418793110184, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002536135977755477}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.29266138157442667, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002359605268115721}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.242613336164728, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0015890115418894523}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.2888554888362579, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.002735901233949605}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3379353521201237, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0027651147680515984}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.278605840076953, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0018385587325905528}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/1b121b21bc4seed4/evaluation/generation/agg.1b121b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_2.json b/1b121b21bc4seed4/evaluation/generation/agg.1b121b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_2.json new file mode 100644 index 0000000000000000000000000000000000000000..99ddd54bd4800f3a696b67012e8cb13acbe04b9e --- /dev/null +++ b/1b121b21bc4seed4/evaluation/generation/agg.1b121b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 5.742107948398635, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.10028477164759789}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.29565325420243477, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002453588842828844}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4646488423809536, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0027682272923222795}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.3384601198644487, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0018343529202461447}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.12425161790639815, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0015558836535121063}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.19872852519022988, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0020164549706803304}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.1419143590408358, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0013500831164610805}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.2129530997072588, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0019300729133295007}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3366936529804091, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0022835557117666257}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.24356776108805483, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0014311711089907218}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.24845067554530403, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0021647527757715974}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3927861198246419, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0026411848326427685}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.2851684134761103, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0017343585089839761}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/1b121b21bc4seed4/evaluation/generation/agg.1b121b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_3.json b/1b121b21bc4seed4/evaluation/generation/agg.1b121b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_3.json new file mode 100644 index 0000000000000000000000000000000000000000..1a9c41e857953c731866a0e2b8af18838a99508a --- /dev/null +++ b/1b121b21bc4seed4/evaluation/generation/agg.1b121b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 6.4394699721339945, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.09285202216690835}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.29243082212800253, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002007031392393103}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.48658038595985936, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0026693414154091597}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.3506865804173511, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.001779876639899985}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.12274569253499107, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0012683595348881287}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.21168968767895338, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002098325368391887}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.14866896202149463, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0013547963115074187}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.2109600351766481, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001491743890572953}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3561629922763884, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002290230370810661}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.25402678782725335, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001368780824274314}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.24846793909198966, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0018381867412554272}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.41481465361399206, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0025983611700810586}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.2983343530741974, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0017256887817233195}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/1b121b21bc4seed4/evaluation/generation/agg.1b121b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_4.json b/1b121b21bc4seed4/evaluation/generation/agg.1b121b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_4.json new file mode 100644 index 0000000000000000000000000000000000000000..b58bf3249c1e787e0c6f17783b4ba17136545590 --- /dev/null +++ b/1b121b21bc4seed4/evaluation/generation/agg.1b121b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 6.654273843780829, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.0932390666677247}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.2898424902183153, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0018791763712852315}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4929161644601487, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0026458279648224167}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.3528059349016549, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0018000619625855965}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.12270875266797653, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0012167312451751447}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.21534342954879904, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002091583190898679}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.15067447176529838, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0013670254769562427}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.2113572265707145, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0013806305214041975}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3649431060660491, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0023133142967620376}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.25852736725378506, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001401625539515259}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.2474150705640244, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0017363350028745841}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.42231678078769985, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0026287105060156485}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.3015553223695305, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0017613480944054503}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/1b121b21bc4seed4/evaluation/generation/agg.1b121b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_5.json b/1b121b21bc4seed4/evaluation/generation/agg.1b121b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_5.json new file mode 100644 index 0000000000000000000000000000000000000000..4edec82b92fa77f1582022621eb7b48050f6b911 --- /dev/null +++ b/1b121b21bc4seed4/evaluation/generation/agg.1b121b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 6.802357053111681, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.07951699425220059}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.28820052977309235, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.001819335493032039}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4993875209074646, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0026615979174856954}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.3535514791757511, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0017635886054965901}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.12189364791898503, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0011831105686679357}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.21913595621439114, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002096881385232064}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.15104186792993882, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0013321860839076213}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.21046833185620123, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0013409452808175167}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3703034038335145, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002340534182475654}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.25938421101288645, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001370532445107939}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.24705433680949515, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0016874826622658786}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.4296857608506914, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0026271257379257085}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.30345160047433223, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0017236299574653685}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/1b121b21bc4seed4/evaluation/generation/agg.1b121b21bc4seed4_gem_xsum_article_DOC_summary_0.json b/1b121b21bc4seed4/evaluation/generation/agg.1b121b21bc4seed4_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..218cf7ece579aa1953ffcf675ecc4ab785e5c5f4 --- /dev/null +++ b/1b121b21bc4seed4/evaluation/generation/agg.1b121b21bc4seed4_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.1319584869435511, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0017902371313440575}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.31843751119441815, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004065977532742336}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.18386318990595807, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0023608331228326847}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.026550837358487143, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0009488542686212192}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.06687473448752221, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002449110168641438}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.0374406012181181, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0013279313692357727}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.10262840876555364, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0013137229936401066}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.25005919357583545, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0032044045017060904}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.14334972946860364, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0017554946172280554}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.10286501129146305, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.001455767441117724}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.2505082141618244, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.003526620853397989}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.14367399097871014, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0019591856753464845}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.3878211321327552, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.0855819143667016}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/1b121b21bc4seed4/evaluation/generation/agg.1b121b21bc4seed4_gem_xsum_article_DOC_summary_1.json b/1b121b21bc4seed4/evaluation/generation/agg.1b121b21bc4seed4_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..937bedd8a65f1dff34396528f423a674a1a55675 --- /dev/null +++ b/1b121b21bc4seed4/evaluation/generation/agg.1b121b21bc4seed4_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.1019316787156134, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.001581412043974921}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.25568536664121694, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.003700241675446601}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.1439882099204442, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0021362210922445256}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.015540487617390818, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007529217251141928}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.040635472267349405, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0020138507639145733}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.022185877818879655, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001068255036385278}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.08189228355883127, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001197668399441684}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.20681340108359003, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0029102146053896064}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.115878171942197, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001626602377075275}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.08167666249359884, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0012870273117968705}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.20631942492572855, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0031137041096314646}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.1155841559891562, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0017520660679357471}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 0.8832546884814032, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.058811836402674386}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/1b121b21bc4seed4/evaluation/generation/agg.1b121b21bc4seed4_gem_xsum_article_DOC_summary_2.json b/1b121b21bc4seed4/evaluation/generation/agg.1b121b21bc4seed4_gem_xsum_article_DOC_summary_2.json new file mode 100644 index 0000000000000000000000000000000000000000..60e933e5c022259cf9dca270322f5f8b4b738078 --- /dev/null +++ b/1b121b21bc4seed4/evaluation/generation/agg.1b121b21bc4seed4_gem_xsum_article_DOC_summary_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.10290215824360217, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0015231953673864073}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.26058699720865636, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0035894470214097272}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.14583874695098636, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002065306633050135}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.014737945386577267, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0006786127154562599}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.038568668595477, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.001838244973766507}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.021091747556253763, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0009730085187477109}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.08227413818990617, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0011579755263600813}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.20926439309232098, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002780994834995758}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.11670562169943377, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0015709631453015703}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.08215243516848891, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0012349033736966245}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.20976643212478632, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0030372441678568622}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.11667262595327746, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016928169860876325}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 0.7747833335044035, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.0735019876667231}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/1b121b21bc4seed4/evaluation/generation/agg.1b121b21bc4seed4_gem_xsum_article_DOC_summary_3.json b/1b121b21bc4seed4/evaluation/generation/agg.1b121b21bc4seed4_gem_xsum_article_DOC_summary_3.json new file mode 100644 index 0000000000000000000000000000000000000000..a6bea9fcc8a8e1142a4a6502aee3c20c4f9f2cc0 --- /dev/null +++ b/1b121b21bc4seed4/evaluation/generation/agg.1b121b21bc4seed4_gem_xsum_article_DOC_summary_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.10120153706706152, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0017736330055289858}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.24519867618515012, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.003884692967238667}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.13973819965273176, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002224503682788521}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.013495672385084116, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0006604205765928289}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.03480405814644667, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0017521611060424783}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.019151399470871626, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0009352465834774729}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.08110610044359444, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0013403478299354114}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.19805114955706876, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.003043793566262139}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.11223173860379815, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0016815182785500226}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.08047900097695888, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0014125980225232948}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.19685244716798667, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0032305682822595357}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.11137976210396107, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0017894136517198234}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 0.7090873399844934, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.06349488292701568}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/1b121b21bc4seed4/evaluation/generation/agg.1b121b21bc4seed4_gem_xsum_article_DOC_summary_4.json b/1b121b21bc4seed4/evaluation/generation/agg.1b121b21bc4seed4_gem_xsum_article_DOC_summary_4.json new file mode 100644 index 0000000000000000000000000000000000000000..ecbd59ebb4459086c8e58c7bec7a25ff14391da8 --- /dev/null +++ b/1b121b21bc4seed4/evaluation/generation/agg.1b121b21bc4seed4_gem_xsum_article_DOC_summary_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.033726207169633135, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0022496434684974704}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.06113232730210851, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0035415467033274375}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.03868164502577274, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.00218983828011114}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.0039452222901913215, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.00047080278624595537}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.008587166126189389, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.000991502763473968}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.005136520819314499, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0005785064861652664}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.027341393262343253, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0018583846671984688}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.0490770784043296, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002826446970390225}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.031102614205213132, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001750893236380802}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.027572756891097318, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0018634013892600786}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.04978804160990521, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002882491425762946}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.031460267393699226, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0017703108056970776}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 0.36966928598813426, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.07413204217069384}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/1b121b21bc4seed4/evaluation/generation/agg.1b121b21bc4seed4_gem_xsum_article_DOC_summary_5.json b/1b121b21bc4seed4/evaluation/generation/agg.1b121b21bc4seed4_gem_xsum_article_DOC_summary_5.json new file mode 100644 index 0000000000000000000000000000000000000000..d85d22857c2686cf19e2a3bf501c090a020ca4aa --- /dev/null +++ b/1b121b21bc4seed4/evaluation/generation/agg.1b121b21bc4seed4_gem_xsum_article_DOC_summary_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.002416790871504932, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.000690024976317744}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.0020318495670589333, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.000586319326403082}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.002116700789094782, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0005901490166052325}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.00016686975621492826, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 9.709108848912936e-05}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.0001078167115902965, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 6.282744363562356e-05}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.00012903395324011984, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 7.455004604564479e-05}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.0017258055760596795, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0004998666139598835}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.0013501651107790925, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.00036589324228248303}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.001471166405296428, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.00040793599808869183}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.0019222911396811744, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0005311080623757342}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.001572836788867691, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.00042709396031823143}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.0016630690627148653, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.00044252995979777765}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 3.696651377011743e-40, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 4.625530268515257e-36}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_GEM-web_nlg_en_PALM_prompt_0.jsonl b/1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_GEM-web_nlg_en_PALM_prompt_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..735d19ccb7f25a6c03e1d35e348742bec0ff78a5 --- /dev/null +++ b/1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_GEM-web_nlg_en_PALM_prompt_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa4a3c40d8c2d51270382d9a8622636c30ce901170e04b88382cdd4c7498b2a5 +size 4164858 diff --git a/1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_GEM-web_nlg_en_PALM_prompt_1.jsonl b/1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_GEM-web_nlg_en_PALM_prompt_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..3dd2316091f957c9cbc30819dd57debb89170a16 --- /dev/null +++ b/1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_GEM-web_nlg_en_PALM_prompt_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c7acfd8c6ac9265f27d3e91e2d277260d39d0b412a87cfef4ca2d43e7d79531 +size 5156927 diff --git a/1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_GEM-web_nlg_en_PALM_prompt_2.jsonl b/1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_GEM-web_nlg_en_PALM_prompt_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..c473de8d36d6288c55104a0743cea542e30b9e3e --- /dev/null +++ b/1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_GEM-web_nlg_en_PALM_prompt_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a64d4b6a254da51ad30d01fb57a616057808e1c54440e7b16ae2b2959741d13b +size 6046465 diff --git a/1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_GEM-web_nlg_en_PALM_prompt_3.jsonl b/1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_GEM-web_nlg_en_PALM_prompt_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..2d4696da97523c45c4a0321c96642580c6aed2c1 --- /dev/null +++ b/1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_GEM-web_nlg_en_PALM_prompt_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:739bdb524e7207a3b8a372d226016d10a76759968380a74d01e2837170a8081a +size 6933828 diff --git a/1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_GEM-web_nlg_en_PALM_prompt_4.jsonl b/1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_GEM-web_nlg_en_PALM_prompt_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..d123e10612c34c7cf9554ed25119c5d089dd757d --- /dev/null +++ b/1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_GEM-web_nlg_en_PALM_prompt_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9b7c4b4c605f6e10cbe9e195482836156377fa49a65596f138e5e8d28a1b325 +size 7835092 diff --git a/1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_GEM-web_nlg_en_PALM_prompt_5.jsonl b/1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_GEM-web_nlg_en_PALM_prompt_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..ef9b845a86832276fdd935fbc98813dbf176f0d4 --- /dev/null +++ b/1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_GEM-web_nlg_en_PALM_prompt_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58e0a6285a6ae6a83b8ab91c3b528fa511086447bfd0fb3396d8193d389b1f2f +size 8731231 diff --git a/1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_GEM-wiki_lingua_en_tldr_en_0.jsonl b/1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_GEM-wiki_lingua_en_tldr_en_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e587d90353537c7d488ec9e6bd29ad25fa77f09c --- /dev/null +++ b/1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_GEM-wiki_lingua_en_tldr_en_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2318924ec6c79ac550bcc940ada44692355860a5ea71109d5813b32367a999a1 +size 7647577 diff --git a/1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_GEM-wiki_lingua_en_tldr_en_1.jsonl b/1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_GEM-wiki_lingua_en_tldr_en_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..a12b93ae82928427b930254f94c26f7e40f41010 --- /dev/null +++ b/1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_GEM-wiki_lingua_en_tldr_en_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b73628460559ea83775004d28a622216004faaefce1c154f70d7de3da293a77b +size 13338857 diff --git a/1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_GEM-wiki_lingua_en_tldr_en_2.jsonl b/1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_GEM-wiki_lingua_en_tldr_en_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..d36db44c4c16e501b06792affd641186bfe14398 --- /dev/null +++ b/1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_GEM-wiki_lingua_en_tldr_en_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48374e4fd65361b8743b96f9142e8afcf81ac9328d3ccc626e46b82b1dbcc849 +size 18915150 diff --git a/1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_GEM-wiki_lingua_en_tldr_en_3.jsonl b/1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_GEM-wiki_lingua_en_tldr_en_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..80f9e3ea2b0e6eff687e87836ca6f3d3be22f635 --- /dev/null +++ b/1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_GEM-wiki_lingua_en_tldr_en_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91a56d149f9c273d2c7a469d35732a8cf6464336fbcb8fda7cf78a210a6437cc +size 24322314 diff --git a/1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_GEM-wiki_lingua_en_tldr_en_4.jsonl b/1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_GEM-wiki_lingua_en_tldr_en_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e0605dacdd0b75d7d4c7a323ca73b4d96cd22640 --- /dev/null +++ b/1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_GEM-wiki_lingua_en_tldr_en_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aef01ae7a3fa55383fc3519e9335f9c52d4b0e6121c3b0a774214a0fc4c1bbd2 +size 29470186 diff --git a/1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_GEM-wiki_lingua_en_tldr_en_5.jsonl b/1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_GEM-wiki_lingua_en_tldr_en_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..c6e2300a74375b480e762a6f32f0a47104d58e2e --- /dev/null +++ b/1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_GEM-wiki_lingua_en_tldr_en_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d970e26bf958ba2bd100dd107d84d8786cda74ed58c539abd261e3f29f2b19d6 +size 34799229 diff --git a/1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl b/1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..dd6c07525bb0c0a04b651f2d85976d9c13bc1c47 --- /dev/null +++ b/1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0305c4e8078e03bf36cf43eaa307a427f905d7bc052443addafa8f394a0f741 +size 3836961 diff --git a/1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl b/1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..a015e8aa3f5aec882fed37954726062c59d82846 --- /dev/null +++ b/1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53531073a324aebce46c43b36a60a1f96bef7b25b247dc1b0a0420985aeef99c +size 5259516 diff --git a/1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl b/1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e969da43f8c7c1124f7259b87bff92b177983973 --- /dev/null +++ b/1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4864829c60166aa69b6b453356e9567bd351bb2fa839e40a30bb885ed4defec +size 6487526 diff --git a/1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl b/1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..b60f3099d7997bc17da9e810662bbd1da25947d0 --- /dev/null +++ b/1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a71ae8c82c6371554db79c1d92ccc4a15bb65a8c41a0fceae5f30fcbd77f3c4 +size 7579139 diff --git a/1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl b/1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..b5b24c925b028bd98a6216771af0455179a06891 --- /dev/null +++ b/1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9964ad83a330f5fc2599de4c4b4e5be0fc6a35d96e82785ccc223bcc32b51ef7 +size 8666380 diff --git a/1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl b/1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..a2e27a8a4f302d6aaa79dedb8f03bcb50861a892 --- /dev/null +++ b/1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f5d2aa46ecb624a15f2036eb5f0447b8c2eb6095ddf79ca16d39592d2ce7be6 +size 9763330 diff --git a/1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_gem_xsum_article_DOC_summary_0.jsonl b/1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_gem_xsum_article_DOC_summary_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..317dc8c2574b34489f34b217664b42c909eb2ada --- /dev/null +++ b/1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_gem_xsum_article_DOC_summary_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc06dac5d6dbb610a373460be20288cd027b066fde7379d4131764fd572b799c +size 2834746 diff --git a/1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_gem_xsum_article_DOC_summary_1.jsonl b/1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_gem_xsum_article_DOC_summary_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..503b72ffc6d5fb0c4fb964497975a82a9f57f270 --- /dev/null +++ b/1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_gem_xsum_article_DOC_summary_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93cbfe830314c7c3af8d0f0225e2391becec4be7c659fa7f659b5813df47d3e2 +size 5107033 diff --git a/1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_gem_xsum_article_DOC_summary_2.jsonl b/1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_gem_xsum_article_DOC_summary_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..05c018500f6b1c4b9a5b8427b984d3d8666a6eb5 --- /dev/null +++ b/1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_gem_xsum_article_DOC_summary_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:695d149d77d70e84f92ccd3b414e5b3880593d950cbf05badc222eb856a31624 +size 7381991 diff --git a/1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_gem_xsum_article_DOC_summary_3.jsonl b/1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_gem_xsum_article_DOC_summary_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..39b8dd3a6a68eca8411547500ba91ed203f23b88 --- /dev/null +++ b/1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_gem_xsum_article_DOC_summary_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b79c4301b0117d9ac1e2c2e67ae97a3c7061a54135a2a9f502422b6db0bae13c +size 9649588 diff --git a/1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_gem_xsum_article_DOC_summary_4.jsonl b/1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_gem_xsum_article_DOC_summary_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..10ab940244a274a2d2778e9082540adf6cc30195 --- /dev/null +++ b/1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_gem_xsum_article_DOC_summary_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e63129a30926f081f4adb8ce91e499faa6ab0c6e387d89e96b62d45f1d304ba +size 11673585 diff --git a/1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_gem_xsum_article_DOC_summary_5.jsonl b/1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_gem_xsum_article_DOC_summary_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..ea6bf64cac7c84bc10d6a0367604c94bbe60fef4 --- /dev/null +++ b/1b121b21bc4seed4/evaluation/generation/examples.1b121b21bc4seed4_gem_xsum_article_DOC_summary_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60b71e3ec88a4710787bf271f8ddea06ae49840f6b83d6ecbf952d19599d401f +size 13897493 diff --git a/1b121b21bc4seed4/evaluation/generation/merged.csv b/1b121b21bc4seed4/evaluation/generation/merged.csv new file mode 100644 index 0000000000000000000000000000000000000000..6b72804a7b4952e45810b89c7a5f12beddd586af --- /dev/null +++ b/1b121b21bc4seed4/evaluation/generation/merged.csv @@ -0,0 +1,53 @@ +dataset,fewshots,prompt,metric,value +e2e_nlg_cleaned,0,generate_text_restaurant,rouge2_fmeasure,0.017364866430399792 +e2e_nlg_cleaned,0,median,rouge2_fmeasure,0.017364866430399792 +e2e_nlg_cleaned,1,generate_text_restaurant,rouge2_fmeasure,0.132388948988302 +e2e_nlg_cleaned,1,median,rouge2_fmeasure,0.132388948988302 +e2e_nlg_cleaned,2,generate_text_restaurant,rouge2_fmeasure,0.1419143590408358 +e2e_nlg_cleaned,2,median,rouge2_fmeasure,0.1419143590408358 +e2e_nlg_cleaned,3,generate_text_restaurant,rouge2_fmeasure,0.14866896202149463 +e2e_nlg_cleaned,3,median,rouge2_fmeasure,0.14866896202149463 +e2e_nlg_cleaned,4,generate_text_restaurant,rouge2_fmeasure,0.15067447176529838 +e2e_nlg_cleaned,4,median,rouge2_fmeasure,0.15067447176529838 +e2e_nlg_cleaned,5,generate_text_restaurant,rouge2_fmeasure,0.15104186792993882 +e2e_nlg_cleaned,5,median,rouge2_fmeasure,0.15104186792993882 +e2e_nlg_cleaned,5,average,multiple,0.12367557936271156 +gem_xsum,0,article_DOC_summary,rouge2_fmeasure,0.0374406012181181 +gem_xsum,0,median,rouge2_fmeasure,0.0374406012181181 +gem_xsum,1,article_DOC_summary,rouge2_fmeasure,0.022185877818879655 +gem_xsum,1,median,rouge2_fmeasure,0.022185877818879655 +gem_xsum,2,article_DOC_summary,rouge2_fmeasure,0.021091747556253763 +gem_xsum,2,median,rouge2_fmeasure,0.021091747556253763 +gem_xsum,3,article_DOC_summary,rouge2_fmeasure,0.019151399470871626 +gem_xsum,3,median,rouge2_fmeasure,0.019151399470871626 +gem_xsum,4,article_DOC_summary,rouge2_fmeasure,0.005136520819314499 +gem_xsum,4,median,rouge2_fmeasure,0.005136520819314499 +gem_xsum,5,article_DOC_summary,rouge2_fmeasure,0.00012903395324011984 +gem_xsum,5,median,rouge2_fmeasure,0.00012903395324011984 +gem_xsum,5,average,multiple,0.017522530139446293 +web_nlg_en,0,PALM_prompt,rouge2_fmeasure,0.045926667677568665 +web_nlg_en,0,median,rouge2_fmeasure,0.045926667677568665 +web_nlg_en,1,PALM_prompt,rouge2_fmeasure,0.043447331936707745 +web_nlg_en,1,median,rouge2_fmeasure,0.043447331936707745 +web_nlg_en,2,PALM_prompt,rouge2_fmeasure,0.044005340063557 +web_nlg_en,2,median,rouge2_fmeasure,0.044005340063557 +web_nlg_en,3,PALM_prompt,rouge2_fmeasure,0.04405862636243696 +web_nlg_en,3,median,rouge2_fmeasure,0.04405862636243696 +web_nlg_en,4,PALM_prompt,rouge2_fmeasure,0.0452158613394661 +web_nlg_en,4,median,rouge2_fmeasure,0.0452158613394661 +web_nlg_en,5,PALM_prompt,rouge2_fmeasure,0.04683784475546268 +web_nlg_en,5,median,rouge2_fmeasure,0.04683784475546268 +web_nlg_en,5,average,multiple,0.04491527868919986 +wiki_lingua_en,0,tldr_en,rouge2_fmeasure,0.0325449603413564 +wiki_lingua_en,0,median,rouge2_fmeasure,0.0325449603413564 +wiki_lingua_en,1,tldr_en,rouge2_fmeasure,0.02872278229177072 +wiki_lingua_en,1,median,rouge2_fmeasure,0.02872278229177072 +wiki_lingua_en,2,tldr_en,rouge2_fmeasure,0.028841983524197482 +wiki_lingua_en,2,median,rouge2_fmeasure,0.028841983524197482 +wiki_lingua_en,3,tldr_en,rouge2_fmeasure,0.025820231326483496 +wiki_lingua_en,3,median,rouge2_fmeasure,0.025820231326483496 +wiki_lingua_en,4,tldr_en,rouge2_fmeasure,0.009339471992932759 +wiki_lingua_en,4,median,rouge2_fmeasure,0.009339471992932759 +wiki_lingua_en,5,tldr_en,rouge2_fmeasure,0.0017395393632540774 +wiki_lingua_en,5,median,rouge2_fmeasure,0.0017395393632540774 +wiki_lingua_en,5,average,multiple,0.02116816147333249 diff --git a/1b121b21bc4seed4/evaluation/generation/merged.json b/1b121b21bc4seed4/evaluation/generation/merged.json new file mode 100644 index 0000000000000000000000000000000000000000..5b66a18f6cae56ee09fddd75e4c241c682a5e9fa --- /dev/null +++ b/1b121b21bc4seed4/evaluation/generation/merged.json @@ -0,0 +1 @@ +{"GEM/web_nlg_en": {"0": {"PALM_prompt": {"bleu": 0.28572015895181313, "bleu_stderr": 0.029996683677028884, "rouge1_fmeasure": 0.09566430048114055, "rouge1_fmeasure_stderr": 0.0019833726857373933, "rouge1_precision": 0.06275107464568752, "rouge1_precision_stderr": 0.001482626784800971, "rouge1_recall": 0.2653496514419625, "rouge1_recall_stderr": 0.0044301076161033445, "rouge2_fmeasure": 0.045926667677568665, "rouge2_fmeasure_stderr": 0.0012416071370673657, "rouge2_precision": 0.03009186338419653, "rouge2_precision_stderr": 0.0009122332803552036, "rouge2_recall": 0.1306746149712155, "rouge2_recall_stderr": 0.003040441899500505, "rougeL_fmeasure": 0.09229607491866483, "rougeL_fmeasure_stderr": 0.0018548951773486634, "rougeL_precision": 0.06029258655079738, "rougeL_precision_stderr": 0.0013643648691810868, "rougeL_recall": 0.25861360612073325, "rougeL_recall_stderr": 0.004336001927934783, "rougeLsum_fmeasure": 0.0914984902210792, "rougeLsum_fmeasure_stderr": 0.0018580702167419888, "rougeLsum_precision": 0.0599952987639967, "rougeLsum_precision_stderr": 0.0013920010929440471, "rougeLsum_recall": 0.25468022554337166, "rougeLsum_recall_stderr": 0.00416218635602354}}, "1": {"PALM_prompt": {"bleu": 0.2733809666843245, "bleu_stderr": 0.017469945535516233, "rouge1_fmeasure": 0.09465272634611742, "rouge1_fmeasure_stderr": 0.0018532707516154, "rouge1_precision": 0.06127827669468516, "rouge1_precision_stderr": 0.0014475626789825216, "rouge1_recall": 0.2912358718895091, "rouge1_recall_stderr": 0.0047559174768431, "rouge2_fmeasure": 0.043447331936707745, "rouge2_fmeasure_stderr": 0.0011595853852308454, "rouge2_precision": 0.028424762596691282, "rouge2_precision_stderr": 0.0009872409719648724, "rouge2_recall": 0.13634361210693505, "rouge2_recall_stderr": 0.0031518261028729865, "rougeL_fmeasure": 0.08967525096022803, "rougeL_fmeasure_stderr": 0.0017040144863156993, "rougeL_precision": 0.05798019246549793, "rougeL_precision_stderr": 0.0013348612234876421, "rougeL_recall": 0.2756227919098518, "rougeL_recall_stderr": 0.004404790096916205, "rougeLsum_fmeasure": 0.09023227224081035, "rougeLsum_fmeasure_stderr": 0.0017566163632365401, "rougeLsum_precision": 0.0584971868634523, "rougeLsum_precision_stderr": 0.001386020107167148, "rougeLsum_recall": 0.2763902169531308, "rougeLsum_recall_stderr": 0.004392872739454734}}, "2": {"PALM_prompt": {"bleu": 0.27692663560456576, "bleu_stderr": 0.020364718206970903, "rouge1_fmeasure": 0.09625717915221209, "rouge1_fmeasure_stderr": 0.00174014878444931, "rouge1_precision": 0.06147368851457221, "rouge1_precision_stderr": 0.0012623013185335313, "rouge1_recall": 0.30263039971208694, "rouge1_recall_stderr": 0.004760584060971739, "rouge2_fmeasure": 0.044005340063557, "rouge2_fmeasure_stderr": 0.0010837646169888715, "rouge2_precision": 0.028063334403907188, "rouge2_precision_stderr": 0.0007662392196332797, "rouge2_recall": 0.14354815751347613, "rouge2_recall_stderr": 0.0032059165700188356, "rougeL_fmeasure": 0.0907708660179587, "rougeL_fmeasure_stderr": 0.0015736293804571027, "rougeL_precision": 0.05786141529156912, "rougeL_precision_stderr": 0.0011333739480816865, "rougeL_recall": 0.286302289137813, "rougeL_recall_stderr": 0.004385346387690765, "rougeLsum_fmeasure": 0.09187344007508645, "rougeLsum_fmeasure_stderr": 0.0016563753568251043, "rougeLsum_precision": 0.058721463920226806, "rougeLsum_precision_stderr": 0.0012062193203122612, "rougeLsum_recall": 0.287696314630283, "rougeLsum_recall_stderr": 0.004428617061773817}}, "3": {"PALM_prompt": {"bleu": 0.29659125910672235, "bleu_stderr": 0.016882600262624867, "rouge1_fmeasure": 0.09650412351241988, "rouge1_fmeasure_stderr": 0.00167247613646195, "rouge1_precision": 0.06145887932212597, "rouge1_precision_stderr": 0.0012169314124561455, "rouge1_recall": 0.30505300258942414, "rouge1_recall_stderr": 0.0047261670100499364, "rouge2_fmeasure": 0.04405862636243696, "rouge2_fmeasure_stderr": 0.0010210491782955636, "rouge2_precision": 0.027901257259455022, "rouge2_precision_stderr": 0.0007085509669261345, "rouge2_recall": 0.14687843284043367, "rouge2_recall_stderr": 0.0032247187337236904, "rougeL_fmeasure": 0.09147131174467073, "rougeL_fmeasure_stderr": 0.0015248452457480056, "rougeL_precision": 0.05816779259264925, "rougeL_precision_stderr": 0.001101022422405542, "rougeL_recall": 0.2897233872600757, "rougeL_recall_stderr": 0.004365094346814999, "rougeLsum_fmeasure": 0.09190353821219928, "rougeLsum_fmeasure_stderr": 0.0015652081391078101, "rougeLsum_precision": 0.058548171185912525, "rougeLsum_precision_stderr": 0.0011357565151254563, "rougeLsum_recall": 0.2895152165474746, "rougeLsum_recall_stderr": 0.004340778368401744}}, "4": {"PALM_prompt": {"bleu": 0.32349384025701167, "bleu_stderr": 0.021841302866309788, "rouge1_fmeasure": 0.09824537940970629, "rouge1_fmeasure_stderr": 0.0017168314347721003, "rouge1_precision": 0.0625728361410853, "rouge1_precision_stderr": 0.0012585041311395817, "rouge1_recall": 0.3094168818387454, "rouge1_recall_stderr": 0.004729097260215436, "rouge2_fmeasure": 0.0452158613394661, "rouge2_fmeasure_stderr": 0.0010697836859867177, "rouge2_precision": 0.028682921178866484, "rouge2_precision_stderr": 0.0007563993720637289, "rouge2_recall": 0.15044042342708142, "rouge2_recall_stderr": 0.003333834053934159, "rougeL_fmeasure": 0.09288695263220921, "rougeL_fmeasure_stderr": 0.0015312884011513372, "rougeL_precision": 0.059023081811736294, "rougeL_precision_stderr": 0.0011089492079030946, "rougeL_recall": 0.29435917450238935, "rougeL_recall_stderr": 0.0044243064370870335, "rougeLsum_fmeasure": 0.09395763356452147, "rougeLsum_fmeasure_stderr": 0.0016024157843164731, "rougeLsum_precision": 0.05982186254258612, "rougeLsum_precision_stderr": 0.0011713233210840226, "rougeLsum_recall": 0.2960727424843719, "rougeLsum_recall_stderr": 0.004432691110581699}}, "5": {"PALM_prompt": {"bleu": 0.3317247520236422, "bleu_stderr": 0.02438683801110983, "rouge1_fmeasure": 0.1015968420316754, "rouge1_fmeasure_stderr": 0.0017067334576059984, "rouge1_precision": 0.06471426127247473, "rouge1_precision_stderr": 0.0012898743879850927, "rouge1_recall": 0.3220301197483266, "rouge1_recall_stderr": 0.004784458908262577, "rouge2_fmeasure": 0.04683784475546268, "rouge2_fmeasure_stderr": 0.0010906780700661233, "rouge2_precision": 0.029766999027414025, "rouge2_precision_stderr": 0.0008118603022394101, "rouge2_recall": 0.15682390612074046, "rouge2_recall_stderr": 0.0033732274141397736, "rougeL_fmeasure": 0.09534760210410158, "rougeL_fmeasure_stderr": 0.001533464120564557, "rougeL_precision": 0.06064903145944483, "rougeL_precision_stderr": 0.0011531567240369417, "rougeL_recall": 0.30378656882887267, "rougeL_recall_stderr": 0.004419672235023449, "rougeLsum_fmeasure": 0.0967982427270365, "rougeLsum_fmeasure_stderr": 0.0015966272469230514, "rougeLsum_precision": 0.061657852757433344, "rougeLsum_precision_stderr": 0.0012078523776645487, "rougeLsum_recall": 0.3073326718000021, "rougeLsum_recall_stderr": 0.004475310017341517}}}, "GEM/wiki_lingua_en": {"0": {"tldr_en": {"bleu": 1.4715584716266366, "bleu_stderr": 0.05979035173894537, "rouge1_fmeasure": 0.15995178659481124, "rouge1_fmeasure_stderr": 0.0019476998067523457, "rouge1_precision": 0.13780680503285866, "rouge1_precision_stderr": 0.001963222074069445, "rouge1_recall": 0.2300113800580128, "rouge1_recall_stderr": 0.0027523450735060214, "rouge2_fmeasure": 0.0325449603413564, "rouge2_fmeasure_stderr": 0.0007946537089430446, "rouge2_precision": 0.027958971164094862, "rouge2_precision_stderr": 0.0007185096475725596, "rouge2_recall": 0.04802627198798666, "rouge2_recall_stderr": 0.0012953632843939321, "rougeL_fmeasure": 0.12806903787214233, "rougeL_fmeasure_stderr": 0.001432165288725186, "rougeL_precision": 0.10894258616198119, "rougeL_precision_stderr": 0.0014095848399899374, "rougeL_recall": 0.18869266341630972, "rougeL_recall_stderr": 0.0022499271779208518, "rougeLsum_fmeasure": 0.14672463644520317, "rougeLsum_fmeasure_stderr": 0.0017705329316914052, "rougeLsum_precision": 0.12619303410814398, "rougeLsum_precision_stderr": 0.0017830267623956222, "rougeLsum_recall": 0.2118167894154195, "rougeLsum_recall_stderr": 0.0025399740287383532}}, "1": {"tldr_en": {"bleu": 1.4105754686734944, "bleu_stderr": 0.05004327536852838, "rouge1_fmeasure": 0.1659619521945487, "rouge1_fmeasure_stderr": 0.0017255813810933987, "rouge1_precision": 0.14303855949220973, "rouge1_precision_stderr": 0.0017883259547811035, "rouge1_recall": 0.2404640566053214, "rouge1_recall_stderr": 0.0025568167624806268, "rouge2_fmeasure": 0.02872278229177072, "rouge2_fmeasure_stderr": 0.0007406492584205885, "rouge2_precision": 0.0247139355641883, "rouge2_precision_stderr": 0.0006686054027706484, "rouge2_recall": 0.043281756890626494, "rouge2_recall_stderr": 0.0012894489706408074, "rougeL_fmeasure": 0.11865039810855227, "rougeL_fmeasure_stderr": 0.0011448070269801268, "rougeL_precision": 0.10120656325023195, "rougeL_precision_stderr": 0.0011799928185521268, "rougeL_recall": 0.17663608162711542, "rougeL_recall_stderr": 0.0019540696402957683, "rougeLsum_fmeasure": 0.15546750970375475, "rougeLsum_fmeasure_stderr": 0.0016049368612675332, "rougeLsum_precision": 0.133863409884033, "rougeLsum_precision_stderr": 0.0016645742544581718, "rougeLsum_recall": 0.22590717474478603, "rougeLsum_recall_stderr": 0.0024041420866198616}}, "2": {"tldr_en": {"bleu": 1.2900289618857925, "bleu_stderr": 0.04780794942619469, "rouge1_fmeasure": 0.1592319273466656, "rouge1_fmeasure_stderr": 0.001799066929060303, "rouge1_precision": 0.1405364837901601, "rouge1_precision_stderr": 0.001939748022665139, "rouge1_recall": 0.22575505407910562, "rouge1_recall_stderr": 0.002550117228501278, "rouge2_fmeasure": 0.028841983524197482, "rouge2_fmeasure_stderr": 0.0007611631081205323, "rouge2_precision": 0.025662875444857295, "rouge2_precision_stderr": 0.0007691462288959418, "rouge2_recall": 0.04175150895044056, "rouge2_recall_stderr": 0.001189901549490804, "rougeL_fmeasure": 0.12364040415407823, "rougeL_fmeasure_stderr": 0.0012736531821000415, "rougeL_precision": 0.1083364462309822, "rougeL_precision_stderr": 0.001405789374506379, "rougeL_recall": 0.17872732097294958, "rougeL_recall_stderr": 0.001999408312244932, "rougeLsum_fmeasure": 0.14844491271068486, "rougeLsum_fmeasure_stderr": 0.0016652808137804262, "rougeLsum_precision": 0.13103000490181455, "rougeLsum_precision_stderr": 0.0018143737843109569, "rougeLsum_recall": 0.2109444720461656, "rougeLsum_recall_stderr": 0.0023822951303522515}}, "3": {"tldr_en": {"bleu": 1.4599914767802553, "bleu_stderr": 0.0635195569874681, "rouge1_fmeasure": 0.1342644995667986, "rouge1_fmeasure_stderr": 0.0019642297496972366, "rouge1_precision": 0.12509614688619689, "rouge1_precision_stderr": 0.002228795608935358, "rouge1_recall": 0.18767300213224564, "rouge1_recall_stderr": 0.0028539387200514476, "rouge2_fmeasure": 0.025820231326483496, "rouge2_fmeasure_stderr": 0.0007752810347348394, "rouge2_precision": 0.024250258441802567, "rouge2_precision_stderr": 0.0009026138649276358, "rouge2_recall": 0.037597498222217, "rouge2_recall_stderr": 0.0012860828030060772, "rougeL_fmeasure": 0.1073751120661638, "rougeL_fmeasure_stderr": 0.00149029795685705, "rougeL_precision": 0.0999116738568996, "rougeL_precision_stderr": 0.0017693027578086957, "rougeL_recall": 0.15265267010514852, "rougeL_recall_stderr": 0.0023328283894968257, "rougeLsum_fmeasure": 0.12525446512455207, "rougeLsum_fmeasure_stderr": 0.001822028086382638, "rougeLsum_precision": 0.11675484033349125, "rougeLsum_precision_stderr": 0.002089428868664697, "rougeLsum_recall": 0.17579490426422517, "rougeLsum_recall_stderr": 0.00269019117553292}}, "4": {"tldr_en": {"bleu": 0.3702833561251355, "bleu_stderr": 0.030351290737556852, "rouge1_fmeasure": 0.04622406565185966, "rouge1_fmeasure_stderr": 0.0016303591829101983, "rouge1_precision": 0.04485321962453146, "rouge1_precision_stderr": 0.0017875667294004294, "rouge1_recall": 0.06630548480377385, "rouge1_recall_stderr": 0.0024064841997783804, "rouge2_fmeasure": 0.009339471992932759, "rouge2_fmeasure_stderr": 0.0005238484713453825, "rouge2_precision": 0.008654276655755648, "rouge2_precision_stderr": 0.0005433398891243852, "rouge2_recall": 0.013973442151458024, "rouge2_recall_stderr": 0.0008607910239468982, "rougeL_fmeasure": 0.03817435899320631, "rougeL_fmeasure_stderr": 0.001315667296339476, "rougeL_precision": 0.03703928516688903, "rougeL_precision_stderr": 0.0014780279022334575, "rougeL_recall": 0.05553695501709392, "rougeL_recall_stderr": 0.0020162336010684924, "rougeLsum_fmeasure": 0.04244591804424164, "rougeLsum_fmeasure_stderr": 0.0014960454994858057, "rougeLsum_precision": 0.04131778962417704, "rougeLsum_precision_stderr": 0.0016612472366310286, "rougeLsum_recall": 0.061078533602158244, "rougeLsum_recall_stderr": 0.0022269504871210042}}, "5": {"tldr_en": {"bleu": 1.0605881261031538e-06, "bleu_stderr": 1.8732681876015495e-06, "rouge1_fmeasure": 0.007838938488476992, "rouge1_fmeasure_stderr": 0.0007592053204344529, "rouge1_precision": 0.007895152558976005, "rouge1_precision_stderr": 0.000844472965838446, "rouge1_recall": 0.011330805175563327, "rouge1_recall_stderr": 0.0011068236259164767, "rouge2_fmeasure": 0.0017395393632540774, "rouge2_fmeasure_stderr": 0.00022581320583642028, "rouge2_precision": 0.001828752443277852, "rouge2_precision_stderr": 0.0002833369118955633, "rouge2_recall": 0.002712234792676449, "rouge2_recall_stderr": 0.00040657012932559535, "rougeL_fmeasure": 0.006459264593320741, "rougeL_fmeasure_stderr": 0.0006146390001712349, "rougeL_precision": 0.006451660866714186, "rougeL_precision_stderr": 0.0006761070510151714, "rougeL_recall": 0.009434380372514109, "rougeL_recall_stderr": 0.0009165354870618827, "rougeLsum_fmeasure": 0.007176068947718324, "rougeLsum_fmeasure_stderr": 0.0006890108922026801, "rougeLsum_precision": 0.007220742560238168, "rougeLsum_precision_stderr": 0.0007677030305742829, "rougeLsum_recall": 0.010470405484261038, "rougeLsum_recall_stderr": 0.0010219886346664543}}}, "e2e_nlg_cleaned": {"0": {"generate_text_restaurant": {"bleu": 1.0756224564831869, "bleu_stderr": 0.064362467364649, "rouge1_fmeasure": 0.11475475475567845, "rouge1_fmeasure_stderr": 0.0016267727810947243, "rouge1_precision": 0.2588235923286985, "rouge1_precision_stderr": 0.004562924193018284, "rouge1_recall": 0.09771851611832182, "rouge1_recall_stderr": 0.0018076944872090492, "rouge2_fmeasure": 0.017364866430399792, "rouge2_fmeasure_stderr": 0.0006257195214464453, "rouge2_precision": 0.07095225790843339, "rouge2_precision_stderr": 0.004012167691904306, "rouge2_recall": 0.018594174934204018, "rouge2_recall_stderr": 0.000789200672023998, "rougeL_fmeasure": 0.10751161947929294, "rougeL_fmeasure_stderr": 0.0015525911247785784, "rougeL_precision": 0.24270724404000282, "rougeL_precision_stderr": 0.004446165912080725, "rougeL_recall": 0.09270329159251155, "rougeL_recall_stderr": 0.001777052888516187, "rougeLsum_fmeasure": 0.1043086079779956, "rougeLsum_fmeasure_stderr": 0.001501216899123504, "rougeLsum_precision": 0.24212046048078248, "rougeLsum_precision_stderr": 0.004500843067139839, "rougeLsum_recall": 0.08721014170888262, "rougeLsum_recall_stderr": 0.0015860867044055972}}, "1": {"generate_text_restaurant": {"bleu": 5.6340703914383115, "bleu_stderr": 0.07802081757825902, "rouge1_fmeasure": 0.3364924250714533, "rouge1_fmeasure_stderr": 0.0019671670892094355, "rouge1_precision": 0.3496844195497873, "rouge1_precision_stderr": 0.0030957066657378565, "rouge1_recall": 0.4061353589201485, "rouge1_recall_stderr": 0.003002747367144736, "rouge2_fmeasure": 0.132388948988302, "rouge2_fmeasure_stderr": 0.0014487165943513271, "rouge2_precision": 0.13845324209640059, "rouge2_precision_stderr": 0.0019371833648373655, "rouge2_recall": 0.1632725866215026, "rouge2_recall_stderr": 0.001973962532025402, "rougeL_fmeasure": 0.242613336164728, "rougeL_fmeasure_stderr": 0.0015890115418894523, "rougeL_precision": 0.2545418793110184, "rougeL_precision_stderr": 0.002536135977755477, "rougeL_recall": 0.29266138157442667, "rougeL_recall_stderr": 0.002359605268115721, "rougeLsum_fmeasure": 0.278605840076953, "rougeLsum_fmeasure_stderr": 0.0018385587325905528, "rougeLsum_precision": 0.2888554888362579, "rougeLsum_precision_stderr": 0.002735901233949605, "rougeLsum_recall": 0.3379353521201237, "rougeLsum_recall_stderr": 0.0027651147680515984}}, "2": {"generate_text_restaurant": {"bleu": 5.742107948398635, "bleu_stderr": 0.10028477164759789, "rouge1_fmeasure": 0.3384601198644487, "rouge1_fmeasure_stderr": 0.0018343529202461447, "rouge1_precision": 0.29565325420243477, "rouge1_precision_stderr": 0.002453588842828844, "rouge1_recall": 0.4646488423809536, "rouge1_recall_stderr": 0.0027682272923222795, "rouge2_fmeasure": 0.1419143590408358, "rouge2_fmeasure_stderr": 0.0013500831164610805, "rouge2_precision": 0.12425161790639815, "rouge2_precision_stderr": 0.0015558836535121063, "rouge2_recall": 0.19872852519022988, "rouge2_recall_stderr": 0.0020164549706803304, "rougeL_fmeasure": 0.24356776108805483, "rougeL_fmeasure_stderr": 0.0014311711089907218, "rougeL_precision": 0.2129530997072588, "rougeL_precision_stderr": 0.0019300729133295007, "rougeL_recall": 0.3366936529804091, "rougeL_recall_stderr": 0.0022835557117666257, "rougeLsum_fmeasure": 0.2851684134761103, "rougeLsum_fmeasure_stderr": 0.0017343585089839761, "rougeLsum_precision": 0.24845067554530403, "rougeLsum_precision_stderr": 0.0021647527757715974, "rougeLsum_recall": 0.3927861198246419, "rougeLsum_recall_stderr": 0.0026411848326427685}}, "3": {"generate_text_restaurant": {"bleu": 6.4394699721339945, "bleu_stderr": 0.09285202216690835, "rouge1_fmeasure": 0.3506865804173511, "rouge1_fmeasure_stderr": 0.001779876639899985, "rouge1_precision": 0.29243082212800253, "rouge1_precision_stderr": 0.002007031392393103, "rouge1_recall": 0.48658038595985936, "rouge1_recall_stderr": 0.0026693414154091597, "rouge2_fmeasure": 0.14866896202149463, "rouge2_fmeasure_stderr": 0.0013547963115074187, "rouge2_precision": 0.12274569253499107, "rouge2_precision_stderr": 0.0012683595348881287, "rouge2_recall": 0.21168968767895338, "rouge2_recall_stderr": 0.002098325368391887, "rougeL_fmeasure": 0.25402678782725335, "rougeL_fmeasure_stderr": 0.001368780824274314, "rougeL_precision": 0.2109600351766481, "rougeL_precision_stderr": 0.001491743890572953, "rougeL_recall": 0.3561629922763884, "rougeL_recall_stderr": 0.002290230370810661, "rougeLsum_fmeasure": 0.2983343530741974, "rougeLsum_fmeasure_stderr": 0.0017256887817233195, "rougeLsum_precision": 0.24846793909198966, "rougeLsum_precision_stderr": 0.0018381867412554272, "rougeLsum_recall": 0.41481465361399206, "rougeLsum_recall_stderr": 0.0025983611700810586}}, "4": {"generate_text_restaurant": {"bleu": 6.654273843780829, "bleu_stderr": 0.0932390666677247, "rouge1_fmeasure": 0.3528059349016549, "rouge1_fmeasure_stderr": 0.0018000619625855965, "rouge1_precision": 0.2898424902183153, "rouge1_precision_stderr": 0.0018791763712852315, "rouge1_recall": 0.4929161644601487, "rouge1_recall_stderr": 0.0026458279648224167, "rouge2_fmeasure": 0.15067447176529838, "rouge2_fmeasure_stderr": 0.0013670254769562427, "rouge2_precision": 0.12270875266797653, "rouge2_precision_stderr": 0.0012167312451751447, "rouge2_recall": 0.21534342954879904, "rouge2_recall_stderr": 0.002091583190898679, "rougeL_fmeasure": 0.25852736725378506, "rougeL_fmeasure_stderr": 0.001401625539515259, "rougeL_precision": 0.2113572265707145, "rougeL_precision_stderr": 0.0013806305214041975, "rougeL_recall": 0.3649431060660491, "rougeL_recall_stderr": 0.0023133142967620376, "rougeLsum_fmeasure": 0.3015553223695305, "rougeLsum_fmeasure_stderr": 0.0017613480944054503, "rougeLsum_precision": 0.2474150705640244, "rougeLsum_precision_stderr": 0.0017363350028745841, "rougeLsum_recall": 0.42231678078769985, "rougeLsum_recall_stderr": 0.0026287105060156485}}, "5": {"generate_text_restaurant": {"bleu": 6.802357053111681, "bleu_stderr": 0.07951699425220059, "rouge1_fmeasure": 0.3535514791757511, "rouge1_fmeasure_stderr": 0.0017635886054965901, "rouge1_precision": 0.28820052977309235, "rouge1_precision_stderr": 0.001819335493032039, "rouge1_recall": 0.4993875209074646, "rouge1_recall_stderr": 0.0026615979174856954, "rouge2_fmeasure": 0.15104186792993882, "rouge2_fmeasure_stderr": 0.0013321860839076213, "rouge2_precision": 0.12189364791898503, "rouge2_precision_stderr": 0.0011831105686679357, "rouge2_recall": 0.21913595621439114, "rouge2_recall_stderr": 0.002096881385232064, "rougeL_fmeasure": 0.25938421101288645, "rougeL_fmeasure_stderr": 0.001370532445107939, "rougeL_precision": 0.21046833185620123, "rougeL_precision_stderr": 0.0013409452808175167, "rougeL_recall": 0.3703034038335145, "rougeL_recall_stderr": 0.002340534182475654, "rougeLsum_fmeasure": 0.30345160047433223, "rougeLsum_fmeasure_stderr": 0.0017236299574653685, "rougeLsum_precision": 0.24705433680949515, "rougeLsum_precision_stderr": 0.0016874826622658786, "rougeLsum_recall": 0.4296857608506914, "rougeLsum_recall_stderr": 0.0026271257379257085}}}, "gem_xsum": {"0": {"article_DOC_summary": {"bleu": 1.3878211321327552, "bleu_stderr": 0.0855819143667016, "rouge1_fmeasure": 0.18386318990595807, "rouge1_fmeasure_stderr": 0.0023608331228326847, "rouge1_precision": 0.1319584869435511, "rouge1_precision_stderr": 0.0017902371313440575, "rouge1_recall": 0.31843751119441815, "rouge1_recall_stderr": 0.004065977532742336, "rouge2_fmeasure": 0.0374406012181181, "rouge2_fmeasure_stderr": 0.0013279313692357727, "rouge2_precision": 0.026550837358487143, "rouge2_precision_stderr": 0.0009488542686212192, "rouge2_recall": 0.06687473448752221, "rouge2_recall_stderr": 0.002449110168641438, "rougeL_fmeasure": 0.14334972946860364, "rougeL_fmeasure_stderr": 0.0017554946172280554, "rougeL_precision": 0.10262840876555364, "rougeL_precision_stderr": 0.0013137229936401066, "rougeL_recall": 0.25005919357583545, "rougeL_recall_stderr": 0.0032044045017060904, "rougeLsum_fmeasure": 0.14367399097871014, "rougeLsum_fmeasure_stderr": 0.0019591856753464845, "rougeLsum_precision": 0.10286501129146305, "rougeLsum_precision_stderr": 0.001455767441117724, "rougeLsum_recall": 0.2505082141618244, "rougeLsum_recall_stderr": 0.003526620853397989}}, "1": {"article_DOC_summary": {"bleu": 0.8832546884814032, "bleu_stderr": 0.058811836402674386, "rouge1_fmeasure": 0.1439882099204442, "rouge1_fmeasure_stderr": 0.0021362210922445256, "rouge1_precision": 0.1019316787156134, "rouge1_precision_stderr": 0.001581412043974921, "rouge1_recall": 0.25568536664121694, "rouge1_recall_stderr": 0.003700241675446601, "rouge2_fmeasure": 0.022185877818879655, "rouge2_fmeasure_stderr": 0.001068255036385278, "rouge2_precision": 0.015540487617390818, "rouge2_precision_stderr": 0.0007529217251141928, "rouge2_recall": 0.040635472267349405, "rouge2_recall_stderr": 0.0020138507639145733, "rougeL_fmeasure": 0.115878171942197, "rougeL_fmeasure_stderr": 0.001626602377075275, "rougeL_precision": 0.08189228355883127, "rougeL_precision_stderr": 0.001197668399441684, "rougeL_recall": 0.20681340108359003, "rougeL_recall_stderr": 0.0029102146053896064, "rougeLsum_fmeasure": 0.1155841559891562, "rougeLsum_fmeasure_stderr": 0.0017520660679357471, "rougeLsum_precision": 0.08167666249359884, "rougeLsum_precision_stderr": 0.0012870273117968705, "rougeLsum_recall": 0.20631942492572855, "rougeLsum_recall_stderr": 0.0031137041096314646}}, "2": {"article_DOC_summary": {"bleu": 0.7747833335044035, "bleu_stderr": 0.0735019876667231, "rouge1_fmeasure": 0.14583874695098636, "rouge1_fmeasure_stderr": 0.002065306633050135, "rouge1_precision": 0.10290215824360217, "rouge1_precision_stderr": 0.0015231953673864073, "rouge1_recall": 0.26058699720865636, "rouge1_recall_stderr": 0.0035894470214097272, "rouge2_fmeasure": 0.021091747556253763, "rouge2_fmeasure_stderr": 0.0009730085187477109, "rouge2_precision": 0.014737945386577267, "rouge2_precision_stderr": 0.0006786127154562599, "rouge2_recall": 0.038568668595477, "rouge2_recall_stderr": 0.001838244973766507, "rougeL_fmeasure": 0.11670562169943377, "rougeL_fmeasure_stderr": 0.0015709631453015703, "rougeL_precision": 0.08227413818990617, "rougeL_precision_stderr": 0.0011579755263600813, "rougeL_recall": 0.20926439309232098, "rougeL_recall_stderr": 0.002780994834995758, "rougeLsum_fmeasure": 0.11667262595327746, "rougeLsum_fmeasure_stderr": 0.0016928169860876325, "rougeLsum_precision": 0.08215243516848891, "rougeLsum_precision_stderr": 0.0012349033736966245, "rougeLsum_recall": 0.20976643212478632, "rougeLsum_recall_stderr": 0.0030372441678568622}}, "3": {"article_DOC_summary": {"bleu": 0.7090873399844934, "bleu_stderr": 0.06349488292701568, "rouge1_fmeasure": 0.13973819965273176, "rouge1_fmeasure_stderr": 0.002224503682788521, "rouge1_precision": 0.10120153706706152, "rouge1_precision_stderr": 0.0017736330055289858, "rouge1_recall": 0.24519867618515012, "rouge1_recall_stderr": 0.003884692967238667, "rouge2_fmeasure": 0.019151399470871626, "rouge2_fmeasure_stderr": 0.0009352465834774729, "rouge2_precision": 0.013495672385084116, "rouge2_precision_stderr": 0.0006604205765928289, "rouge2_recall": 0.03480405814644667, "rouge2_recall_stderr": 0.0017521611060424783, "rougeL_fmeasure": 0.11223173860379815, "rougeL_fmeasure_stderr": 0.0016815182785500226, "rougeL_precision": 0.08110610044359444, "rougeL_precision_stderr": 0.0013403478299354114, "rougeL_recall": 0.19805114955706876, "rougeL_recall_stderr": 0.003043793566262139, "rougeLsum_fmeasure": 0.11137976210396107, "rougeLsum_fmeasure_stderr": 0.0017894136517198234, "rougeLsum_precision": 0.08047900097695888, "rougeLsum_precision_stderr": 0.0014125980225232948, "rougeLsum_recall": 0.19685244716798667, "rougeLsum_recall_stderr": 0.0032305682822595357}}, "4": {"article_DOC_summary": {"bleu": 0.36966928598813426, "bleu_stderr": 0.07413204217069384, "rouge1_fmeasure": 0.03868164502577274, "rouge1_fmeasure_stderr": 0.00218983828011114, "rouge1_precision": 0.033726207169633135, "rouge1_precision_stderr": 0.0022496434684974704, "rouge1_recall": 0.06113232730210851, "rouge1_recall_stderr": 0.0035415467033274375, "rouge2_fmeasure": 0.005136520819314499, "rouge2_fmeasure_stderr": 0.0005785064861652664, "rouge2_precision": 0.0039452222901913215, "rouge2_precision_stderr": 0.00047080278624595537, "rouge2_recall": 0.008587166126189389, "rouge2_recall_stderr": 0.000991502763473968, "rougeL_fmeasure": 0.031102614205213132, "rougeL_fmeasure_stderr": 0.001750893236380802, "rougeL_precision": 0.027341393262343253, "rougeL_precision_stderr": 0.0018583846671984688, "rougeL_recall": 0.0490770784043296, "rougeL_recall_stderr": 0.002826446970390225, "rougeLsum_fmeasure": 0.031460267393699226, "rougeLsum_fmeasure_stderr": 0.0017703108056970776, "rougeLsum_precision": 0.027572756891097318, "rougeLsum_precision_stderr": 0.0018634013892600786, "rougeLsum_recall": 0.04978804160990521, "rougeLsum_recall_stderr": 0.002882491425762946}}, "5": {"article_DOC_summary": {"bleu": 3.696651377011743e-40, "bleu_stderr": 4.625530268515257e-36, "rouge1_fmeasure": 0.002116700789094782, "rouge1_fmeasure_stderr": 0.0005901490166052325, "rouge1_precision": 0.002416790871504932, "rouge1_precision_stderr": 0.000690024976317744, "rouge1_recall": 0.0020318495670589333, "rouge1_recall_stderr": 0.000586319326403082, "rouge2_fmeasure": 0.00012903395324011984, "rouge2_fmeasure_stderr": 7.455004604564479e-05, "rouge2_precision": 0.00016686975621492826, "rouge2_precision_stderr": 9.709108848912936e-05, "rouge2_recall": 0.0001078167115902965, "rouge2_recall_stderr": 6.282744363562356e-05, "rougeL_fmeasure": 0.001471166405296428, "rougeL_fmeasure_stderr": 0.00040793599808869183, "rougeL_precision": 0.0017258055760596795, "rougeL_precision_stderr": 0.0004998666139598835, "rougeL_recall": 0.0013501651107790925, "rougeL_recall_stderr": 0.00036589324228248303, "rougeLsum_fmeasure": 0.0016630690627148653, "rougeLsum_fmeasure_stderr": 0.00044252995979777765, "rougeLsum_precision": 0.0019222911396811744, "rougeLsum_precision_stderr": 0.0005311080623757342, "rougeLsum_recall": 0.001572836788867691, "rougeLsum_recall_stderr": 0.00042709396031823143}}}} \ No newline at end of file diff --git a/1b121b21bc4seed4/evaluation/generation/slim.1b121b21bc4seed4_GEM-web_nlg_en_PALM_prompt_0.json b/1b121b21bc4seed4/evaluation/generation/slim.1b121b21bc4seed4_GEM-web_nlg_en_PALM_prompt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..39264440e951ad97830574504115bb5fa21edd3c --- /dev/null +++ b/1b121b21bc4seed4/evaluation/generation/slim.1b121b21bc4seed4_GEM-web_nlg_en_PALM_prompt_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.28572015895181313, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.029996683677028884 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.06275107464568752, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.001482626784800971 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.2653496514419625, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0044301076161033445 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.09566430048114055, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0019833726857373933 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03009186338419653, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0009122332803552036 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.1306746149712155, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003040441899500505 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.045926667677568665, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0012416071370673657 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.06029258655079738, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0013643648691810868 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.25861360612073325, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004336001927934783 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.09229607491866483, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0018548951773486634 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.0599952987639967, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0013920010929440471 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.25468022554337166, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.00416218635602354 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.0914984902210792, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0018580702167419888 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed4/evaluation/generation/slim.1b121b21bc4seed4_GEM-web_nlg_en_PALM_prompt_1.json b/1b121b21bc4seed4/evaluation/generation/slim.1b121b21bc4seed4_GEM-web_nlg_en_PALM_prompt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..4a33916db382fe754ef413c879678b38982473d0 --- /dev/null +++ b/1b121b21bc4seed4/evaluation/generation/slim.1b121b21bc4seed4_GEM-web_nlg_en_PALM_prompt_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.2733809666843245, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.017469945535516233 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.06127827669468516, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0014475626789825216 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.2912358718895091, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0047559174768431 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.09465272634611742, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0018532707516154 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.028424762596691282, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0009872409719648724 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.13634361210693505, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0031518261028729865 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.043447331936707745, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0011595853852308454 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.05798019246549793, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0013348612234876421 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.2756227919098518, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004404790096916205 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.08967525096022803, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0017040144863156993 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.0584971868634523, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.001386020107167148 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.2763902169531308, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004392872739454734 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.09023227224081035, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0017566163632365401 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed4/evaluation/generation/slim.1b121b21bc4seed4_GEM-web_nlg_en_PALM_prompt_2.json b/1b121b21bc4seed4/evaluation/generation/slim.1b121b21bc4seed4_GEM-web_nlg_en_PALM_prompt_2.json new file mode 100644 index 0000000000000000000000000000000000000000..1c7cec5e406eb2ea775852df47404f49c1d4b4a6 --- /dev/null +++ b/1b121b21bc4seed4/evaluation/generation/slim.1b121b21bc4seed4_GEM-web_nlg_en_PALM_prompt_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.27692663560456576, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.020364718206970903 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.06147368851457221, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0012623013185335313 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.30263039971208694, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.004760584060971739 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.09625717915221209, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.00174014878444931 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.028063334403907188, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007662392196332797 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.14354815751347613, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0032059165700188356 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.044005340063557, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0010837646169888715 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.05786141529156912, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0011333739480816865 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.286302289137813, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004385346387690765 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.0907708660179587, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0015736293804571027 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.058721463920226806, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0012062193203122612 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.287696314630283, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004428617061773817 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.09187344007508645, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0016563753568251043 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed4/evaluation/generation/slim.1b121b21bc4seed4_GEM-web_nlg_en_PALM_prompt_3.json b/1b121b21bc4seed4/evaluation/generation/slim.1b121b21bc4seed4_GEM-web_nlg_en_PALM_prompt_3.json new file mode 100644 index 0000000000000000000000000000000000000000..234675adf3fa26063d8857a76297020d2c11099e --- /dev/null +++ b/1b121b21bc4seed4/evaluation/generation/slim.1b121b21bc4seed4_GEM-web_nlg_en_PALM_prompt_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.29659125910672235, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.016882600262624867 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.06145887932212597, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0012169314124561455 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.30505300258942414, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0047261670100499364 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.09650412351241988, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.00167247613646195 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.027901257259455022, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007085509669261345 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.14687843284043367, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0032247187337236904 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.04405862636243696, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0010210491782955636 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.05816779259264925, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.001101022422405542 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.2897233872600757, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004365094346814999 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.09147131174467073, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0015248452457480056 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.058548171185912525, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0011357565151254563 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.2895152165474746, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004340778368401744 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.09190353821219928, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0015652081391078101 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed4/evaluation/generation/slim.1b121b21bc4seed4_GEM-web_nlg_en_PALM_prompt_4.json b/1b121b21bc4seed4/evaluation/generation/slim.1b121b21bc4seed4_GEM-web_nlg_en_PALM_prompt_4.json new file mode 100644 index 0000000000000000000000000000000000000000..f8b07798c133515c632ed1db6e7fa3df436eb98d --- /dev/null +++ b/1b121b21bc4seed4/evaluation/generation/slim.1b121b21bc4seed4_GEM-web_nlg_en_PALM_prompt_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.32349384025701167, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.021841302866309788 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.0625728361410853, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0012585041311395817 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.3094168818387454, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.004729097260215436 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.09824537940970629, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0017168314347721003 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.028682921178866484, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007563993720637289 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.15044042342708142, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003333834053934159 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.0452158613394661, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0010697836859867177 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.059023081811736294, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0011089492079030946 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.29435917450238935, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0044243064370870335 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.09288695263220921, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0015312884011513372 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.05982186254258612, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0011713233210840226 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.2960727424843719, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004432691110581699 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.09395763356452147, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0016024157843164731 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed4/evaluation/generation/slim.1b121b21bc4seed4_GEM-web_nlg_en_PALM_prompt_5.json b/1b121b21bc4seed4/evaluation/generation/slim.1b121b21bc4seed4_GEM-web_nlg_en_PALM_prompt_5.json new file mode 100644 index 0000000000000000000000000000000000000000..57476838acee1b9b67c9ebbf141a8296ed6d8d4a --- /dev/null +++ b/1b121b21bc4seed4/evaluation/generation/slim.1b121b21bc4seed4_GEM-web_nlg_en_PALM_prompt_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.3317247520236422, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.02438683801110983 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.06471426127247473, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0012898743879850927 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.3220301197483266, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.004784458908262577 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.1015968420316754, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0017067334576059984 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.029766999027414025, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0008118603022394101 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.15682390612074046, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0033732274141397736 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.04683784475546268, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0010906780700661233 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.06064903145944483, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0011531567240369417 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.30378656882887267, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004419672235023449 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.09534760210410158, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.001533464120564557 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.061657852757433344, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0012078523776645487 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.3073326718000021, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004475310017341517 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.0967982427270365, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0015966272469230514 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed4/evaluation/generation/slim.1b121b21bc4seed4_GEM-wiki_lingua_en_tldr_en_0.json b/1b121b21bc4seed4/evaluation/generation/slim.1b121b21bc4seed4_GEM-wiki_lingua_en_tldr_en_0.json new file mode 100644 index 0000000000000000000000000000000000000000..f8a2638a6ae415303cf16a0b78c25a4daa757756 --- /dev/null +++ b/1b121b21bc4seed4/evaluation/generation/slim.1b121b21bc4seed4_GEM-wiki_lingua_en_tldr_en_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.13780680503285866, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.001963222074069445 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.2300113800580128, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0027523450735060214 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.15995178659481124, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0019476998067523457 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.027958971164094862, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007185096475725596 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.04802627198798666, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0012953632843939321 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.0325449603413564, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0007946537089430446 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.10894258616198119, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0014095848399899374 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.18869266341630972, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0022499271779208518 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.12806903787214233, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.001432165288725186 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.12619303410814398, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0017830267623956222 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.2118167894154195, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0025399740287383532 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.14672463644520317, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0017705329316914052 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 1.4715584716266366, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.05979035173894537 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed4/evaluation/generation/slim.1b121b21bc4seed4_GEM-wiki_lingua_en_tldr_en_1.json b/1b121b21bc4seed4/evaluation/generation/slim.1b121b21bc4seed4_GEM-wiki_lingua_en_tldr_en_1.json new file mode 100644 index 0000000000000000000000000000000000000000..d4959123f0c4711d037cc2612d838f5ca04189ba --- /dev/null +++ b/1b121b21bc4seed4/evaluation/generation/slim.1b121b21bc4seed4_GEM-wiki_lingua_en_tldr_en_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.14303855949220973, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0017883259547811035 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.2404640566053214, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0025568167624806268 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.1659619521945487, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0017255813810933987 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.0247139355641883, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0006686054027706484 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.043281756890626494, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0012894489706408074 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.02872278229177072, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0007406492584205885 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.10120656325023195, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0011799928185521268 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.17663608162711542, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0019540696402957683 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.11865039810855227, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0011448070269801268 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.133863409884033, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0016645742544581718 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.22590717474478603, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0024041420866198616 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.15546750970375475, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0016049368612675332 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 1.4105754686734944, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.05004327536852838 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed4/evaluation/generation/slim.1b121b21bc4seed4_GEM-wiki_lingua_en_tldr_en_2.json b/1b121b21bc4seed4/evaluation/generation/slim.1b121b21bc4seed4_GEM-wiki_lingua_en_tldr_en_2.json new file mode 100644 index 0000000000000000000000000000000000000000..d9c5f7b1e21fa7e06112ed58a8e82cb2b2465aca --- /dev/null +++ b/1b121b21bc4seed4/evaluation/generation/slim.1b121b21bc4seed4_GEM-wiki_lingua_en_tldr_en_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.1405364837901601, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.001939748022665139 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.22575505407910562, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.002550117228501278 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.1592319273466656, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.001799066929060303 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.025662875444857295, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007691462288959418 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.04175150895044056, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.001189901549490804 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.028841983524197482, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0007611631081205323 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.1083364462309822, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.001405789374506379 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.17872732097294958, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.001999408312244932 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.12364040415407823, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0012736531821000415 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.13103000490181455, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0018143737843109569 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.2109444720461656, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0023822951303522515 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.14844491271068486, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0016652808137804262 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 1.2900289618857925, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.04780794942619469 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed4/evaluation/generation/slim.1b121b21bc4seed4_GEM-wiki_lingua_en_tldr_en_3.json b/1b121b21bc4seed4/evaluation/generation/slim.1b121b21bc4seed4_GEM-wiki_lingua_en_tldr_en_3.json new file mode 100644 index 0000000000000000000000000000000000000000..3e471041545dc4bacf6bdf0a6de5ad6bb57bc141 --- /dev/null +++ b/1b121b21bc4seed4/evaluation/generation/slim.1b121b21bc4seed4_GEM-wiki_lingua_en_tldr_en_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.12509614688619689, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.002228795608935358 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.18767300213224564, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0028539387200514476 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.1342644995667986, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0019642297496972366 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.024250258441802567, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0009026138649276358 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.037597498222217, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0012860828030060772 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.025820231326483496, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0007752810347348394 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.0999116738568996, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0017693027578086957 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.15265267010514852, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0023328283894968257 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.1073751120661638, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.00149029795685705 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.11675484033349125, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.002089428868664697 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.17579490426422517, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.00269019117553292 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.12525446512455207, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.001822028086382638 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 1.4599914767802553, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.0635195569874681 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed4/evaluation/generation/slim.1b121b21bc4seed4_GEM-wiki_lingua_en_tldr_en_4.json b/1b121b21bc4seed4/evaluation/generation/slim.1b121b21bc4seed4_GEM-wiki_lingua_en_tldr_en_4.json new file mode 100644 index 0000000000000000000000000000000000000000..d648ac56bb8b7d81d163e349edca394f853684d2 --- /dev/null +++ b/1b121b21bc4seed4/evaluation/generation/slim.1b121b21bc4seed4_GEM-wiki_lingua_en_tldr_en_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.04485321962453146, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0017875667294004294 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.06630548480377385, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0024064841997783804 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.04622406565185966, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0016303591829101983 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.008654276655755648, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0005433398891243852 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.013973442151458024, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0008607910239468982 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.009339471992932759, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0005238484713453825 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.03703928516688903, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0014780279022334575 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.05553695501709392, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0020162336010684924 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.03817435899320631, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.001315667296339476 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.04131778962417704, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0016612472366310286 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.061078533602158244, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0022269504871210042 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.04244591804424164, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0014960454994858057 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 0.3702833561251355, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.030351290737556852 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed4/evaluation/generation/slim.1b121b21bc4seed4_GEM-wiki_lingua_en_tldr_en_5.json b/1b121b21bc4seed4/evaluation/generation/slim.1b121b21bc4seed4_GEM-wiki_lingua_en_tldr_en_5.json new file mode 100644 index 0000000000000000000000000000000000000000..35cfdcb6027c7753b9ff3593f9bab5287c260e09 --- /dev/null +++ b/1b121b21bc4seed4/evaluation/generation/slim.1b121b21bc4seed4_GEM-wiki_lingua_en_tldr_en_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.007895152558976005, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.000844472965838446 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.011330805175563327, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0011068236259164767 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.007838938488476992, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0007592053204344529 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.001828752443277852, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0002833369118955633 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.002712234792676449, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.00040657012932559535 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.0017395393632540774, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.00022581320583642028 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.006451660866714186, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0006761070510151714 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.009434380372514109, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0009165354870618827 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.006459264593320741, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0006146390001712349 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.007220742560238168, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0007677030305742829 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.010470405484261038, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0010219886346664543 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.007176068947718324, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0006890108922026801 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 1.0605881261031538e-06, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 1.8732681876015495e-06 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed4/evaluation/generation/slim.1b121b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_0.json b/1b121b21bc4seed4/evaluation/generation/slim.1b121b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..9daf1c665420608b308a28defd06104f5fbeb157 --- /dev/null +++ b/1b121b21bc4seed4/evaluation/generation/slim.1b121b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 1.0756224564831869, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.064362467364649 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.2588235923286985, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.004562924193018284 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.09771851611832182, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0018076944872090492 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.11475475475567845, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0016267727810947243 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.07095225790843339, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.004012167691904306 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.018594174934204018, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.000789200672023998 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.017364866430399792, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0006257195214464453 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.24270724404000282, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.004446165912080725 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.09270329159251155, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.001777052888516187 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.10751161947929294, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0015525911247785784 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.24212046048078248, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.004500843067139839 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.08721014170888262, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0015860867044055972 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.1043086079779956, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.001501216899123504 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed4/evaluation/generation/slim.1b121b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_1.json b/1b121b21bc4seed4/evaluation/generation/slim.1b121b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_1.json new file mode 100644 index 0000000000000000000000000000000000000000..5c6ac8162872988483b2f683936ed7a1d1ecc647 --- /dev/null +++ b/1b121b21bc4seed4/evaluation/generation/slim.1b121b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 5.6340703914383115, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.07802081757825902 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.3496844195497873, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0030957066657378565 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4061353589201485, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.003002747367144736 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.3364924250714533, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0019671670892094355 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.13845324209640059, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0019371833648373655 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.1632725866215026, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.001973962532025402 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.132388948988302, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0014487165943513271 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.2545418793110184, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.002536135977755477 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.29266138157442667, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.002359605268115721 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.242613336164728, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0015890115418894523 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.2888554888362579, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.002735901233949605 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3379353521201237, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0027651147680515984 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.278605840076953, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0018385587325905528 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed4/evaluation/generation/slim.1b121b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_2.json b/1b121b21bc4seed4/evaluation/generation/slim.1b121b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_2.json new file mode 100644 index 0000000000000000000000000000000000000000..ca6e049a269defb6e6e0ffa3ee86c1c48b1edcfa --- /dev/null +++ b/1b121b21bc4seed4/evaluation/generation/slim.1b121b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 5.742107948398635, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.10028477164759789 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.29565325420243477, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.002453588842828844 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4646488423809536, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0027682272923222795 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.3384601198644487, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0018343529202461447 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.12425161790639815, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0015558836535121063 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.19872852519022988, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0020164549706803304 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.1419143590408358, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0013500831164610805 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.2129530997072588, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0019300729133295007 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3366936529804091, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0022835557117666257 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.24356776108805483, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0014311711089907218 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.24845067554530403, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0021647527757715974 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3927861198246419, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0026411848326427685 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.2851684134761103, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0017343585089839761 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed4/evaluation/generation/slim.1b121b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_3.json b/1b121b21bc4seed4/evaluation/generation/slim.1b121b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_3.json new file mode 100644 index 0000000000000000000000000000000000000000..c2db8c18fb04077a61ffbb477428e1d47f44b047 --- /dev/null +++ b/1b121b21bc4seed4/evaluation/generation/slim.1b121b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 6.4394699721339945, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.09285202216690835 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.29243082212800253, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.002007031392393103 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.48658038595985936, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0026693414154091597 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.3506865804173511, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.001779876639899985 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.12274569253499107, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0012683595348881287 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.21168968767895338, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.002098325368391887 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.14866896202149463, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0013547963115074187 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.2109600351766481, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.001491743890572953 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3561629922763884, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.002290230370810661 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.25402678782725335, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.001368780824274314 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.24846793909198966, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0018381867412554272 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.41481465361399206, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0025983611700810586 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.2983343530741974, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0017256887817233195 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed4/evaluation/generation/slim.1b121b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_4.json b/1b121b21bc4seed4/evaluation/generation/slim.1b121b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_4.json new file mode 100644 index 0000000000000000000000000000000000000000..7ddc3ef47198a5dca21177caa03bdb493b6445e2 --- /dev/null +++ b/1b121b21bc4seed4/evaluation/generation/slim.1b121b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 6.654273843780829, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.0932390666677247 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.2898424902183153, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0018791763712852315 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4929161644601487, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0026458279648224167 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.3528059349016549, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0018000619625855965 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.12270875266797653, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0012167312451751447 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.21534342954879904, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.002091583190898679 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.15067447176529838, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0013670254769562427 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.2113572265707145, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0013806305214041975 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3649431060660491, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0023133142967620376 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.25852736725378506, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.001401625539515259 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.2474150705640244, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0017363350028745841 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.42231678078769985, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0026287105060156485 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.3015553223695305, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0017613480944054503 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed4/evaluation/generation/slim.1b121b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_5.json b/1b121b21bc4seed4/evaluation/generation/slim.1b121b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_5.json new file mode 100644 index 0000000000000000000000000000000000000000..b010d560fe9267cfeb0f9ae77e2e73a67d677a8c --- /dev/null +++ b/1b121b21bc4seed4/evaluation/generation/slim.1b121b21bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 6.802357053111681, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.07951699425220059 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.28820052977309235, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.001819335493032039 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4993875209074646, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0026615979174856954 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.3535514791757511, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0017635886054965901 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.12189364791898503, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0011831105686679357 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.21913595621439114, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.002096881385232064 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.15104186792993882, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0013321860839076213 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.21046833185620123, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0013409452808175167 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3703034038335145, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.002340534182475654 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.25938421101288645, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.001370532445107939 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.24705433680949515, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0016874826622658786 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.4296857608506914, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0026271257379257085 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.30345160047433223, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0017236299574653685 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed4/evaluation/generation/slim.1b121b21bc4seed4_gem_xsum_article_DOC_summary_0.json b/1b121b21bc4seed4/evaluation/generation/slim.1b121b21bc4seed4_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..87de500852bfc61d36f13ef374da21435a4d080e --- /dev/null +++ b/1b121b21bc4seed4/evaluation/generation/slim.1b121b21bc4seed4_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.1319584869435511, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0017902371313440575 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.31843751119441815, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004065977532742336 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.18386318990595807, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0023608331228326847 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.026550837358487143, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0009488542686212192 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.06687473448752221, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.002449110168641438 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.0374406012181181, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0013279313692357727 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.10262840876555364, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0013137229936401066 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.25005919357583545, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0032044045017060904 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.14334972946860364, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0017554946172280554 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.10286501129146305, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.001455767441117724 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.2505082141618244, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.003526620853397989 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.14367399097871014, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0019591856753464845 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.3878211321327552, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.0855819143667016 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed4/evaluation/generation/slim.1b121b21bc4seed4_gem_xsum_article_DOC_summary_1.json b/1b121b21bc4seed4/evaluation/generation/slim.1b121b21bc4seed4_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..83e39cfd40c95764bff4351a45abba83d966d9a8 --- /dev/null +++ b/1b121b21bc4seed4/evaluation/generation/slim.1b121b21bc4seed4_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.1019316787156134, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.001581412043974921 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.25568536664121694, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.003700241675446601 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.1439882099204442, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0021362210922445256 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.015540487617390818, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0007529217251141928 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.040635472267349405, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0020138507639145733 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.022185877818879655, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.001068255036385278 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.08189228355883127, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.001197668399441684 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.20681340108359003, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0029102146053896064 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.115878171942197, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.001626602377075275 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.08167666249359884, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0012870273117968705 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.20631942492572855, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0031137041096314646 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.1155841559891562, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0017520660679357471 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 0.8832546884814032, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.058811836402674386 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed4/evaluation/generation/slim.1b121b21bc4seed4_gem_xsum_article_DOC_summary_2.json b/1b121b21bc4seed4/evaluation/generation/slim.1b121b21bc4seed4_gem_xsum_article_DOC_summary_2.json new file mode 100644 index 0000000000000000000000000000000000000000..fda9a0545f6ca2c0d57f3b165e2ebd51b9aa995b --- /dev/null +++ b/1b121b21bc4seed4/evaluation/generation/slim.1b121b21bc4seed4_gem_xsum_article_DOC_summary_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.10290215824360217, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0015231953673864073 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.26058699720865636, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.0035894470214097272 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.14583874695098636, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.002065306633050135 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.014737945386577267, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0006786127154562599 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.038568668595477, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.001838244973766507 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.021091747556253763, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0009730085187477109 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.08227413818990617, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0011579755263600813 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.20926439309232098, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.002780994834995758 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.11670562169943377, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0015709631453015703 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.08215243516848891, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0012349033736966245 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.20976643212478632, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0030372441678568622 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.11667262595327746, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0016928169860876325 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 0.7747833335044035, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.0735019876667231 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed4/evaluation/generation/slim.1b121b21bc4seed4_gem_xsum_article_DOC_summary_3.json b/1b121b21bc4seed4/evaluation/generation/slim.1b121b21bc4seed4_gem_xsum_article_DOC_summary_3.json new file mode 100644 index 0000000000000000000000000000000000000000..8ab9eec79f76471fc69f0397986972c309fb7c2a --- /dev/null +++ b/1b121b21bc4seed4/evaluation/generation/slim.1b121b21bc4seed4_gem_xsum_article_DOC_summary_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.10120153706706152, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0017736330055289858 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.24519867618515012, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.003884692967238667 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.13973819965273176, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.002224503682788521 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.013495672385084116, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0006604205765928289 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.03480405814644667, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0017521611060424783 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.019151399470871626, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0009352465834774729 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.08110610044359444, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0013403478299354114 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.19805114955706876, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.003043793566262139 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.11223173860379815, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0016815182785500226 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.08047900097695888, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0014125980225232948 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.19685244716798667, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0032305682822595357 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.11137976210396107, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0017894136517198234 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 0.7090873399844934, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.06349488292701568 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed4/evaluation/generation/slim.1b121b21bc4seed4_gem_xsum_article_DOC_summary_4.json b/1b121b21bc4seed4/evaluation/generation/slim.1b121b21bc4seed4_gem_xsum_article_DOC_summary_4.json new file mode 100644 index 0000000000000000000000000000000000000000..b2f92e7e75023f9c27a1ff23b9f7956ff0b2363e --- /dev/null +++ b/1b121b21bc4seed4/evaluation/generation/slim.1b121b21bc4seed4_gem_xsum_article_DOC_summary_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.033726207169633135, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0022496434684974704 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.06113232730210851, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.0035415467033274375 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.03868164502577274, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.00218983828011114 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.0039452222901913215, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.00047080278624595537 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.008587166126189389, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.000991502763473968 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.005136520819314499, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0005785064861652664 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.027341393262343253, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0018583846671984688 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.0490770784043296, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.002826446970390225 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.031102614205213132, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.001750893236380802 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.027572756891097318, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0018634013892600786 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.04978804160990521, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.002882491425762946 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.031460267393699226, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0017703108056970776 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 0.36966928598813426, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.07413204217069384 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed4/evaluation/generation/slim.1b121b21bc4seed4_gem_xsum_article_DOC_summary_5.json b/1b121b21bc4seed4/evaluation/generation/slim.1b121b21bc4seed4_gem_xsum_article_DOC_summary_5.json new file mode 100644 index 0000000000000000000000000000000000000000..6c735d5d2dceb6f62a435e42c7ec1f79ebcbd1ee --- /dev/null +++ b/1b121b21bc4seed4/evaluation/generation/slim.1b121b21bc4seed4_gem_xsum_article_DOC_summary_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.002416790871504932, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.000690024976317744 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.0020318495670589333, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.000586319326403082 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.002116700789094782, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0005901490166052325 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.00016686975621492826, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 9.709108848912936e-05 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.0001078167115902965, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 6.282744363562356e-05 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.00012903395324011984, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 7.455004604564479e-05 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.0017258055760596795, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0004998666139598835 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.0013501651107790925, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.00036589324228248303 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.001471166405296428, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.00040793599808869183 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.0019222911396811744, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0005311080623757342 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.001572836788867691, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.00042709396031823143 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.0016630690627148653, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.00044252995979777765 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 3.696651377011743e-40, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 4.625530268515257e-36 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-1b1-21b-c4seeds/1b121b21bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed4/evaluation/rankeval/1b121b21bc4seed4_0.csv b/1b121b21bc4seed4/evaluation/rankeval/1b121b21bc4seed4_0.csv new file mode 100644 index 0000000000000000000000000000000000000000..0193dd4f9f7c6ce4f674e01d4e63fa176a887123 --- /dev/null +++ b/1b121b21bc4seed4/evaluation/rankeval/1b121b21bc4seed4_0.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.334,0.01492201952373296,0 +anli_r2,acc,0.339,0.014976758771620344,0 +anli_r3,acc,0.3333333333333333,0.013613950010225596,0 +arc_challenge,acc,0.21843003412969283,0.012074291605700978,0 +arc_challenge,acc_norm,0.26023890784982934,0.012821930225112563,0 +arc_easy,acc,0.5122053872053872,0.010256726235129004,0 +arc_easy,acc_norm,0.42887205387205385,0.010155440652900152,0 +boolq,acc,0.5152905198776758,0.008740964832224342,1 +cb,acc,0.5,0.06741998624632421,1 +cb,f1,0.31768388106416273,,1 +copa,acc,0.72,0.04512608598542127,0 +hellaswag,acc,0.3577972515435172,0.004783723798286502,0 +hellaswag,acc_norm,0.4344752041426011,0.00494674860827134,0 +piqa,acc,0.6936887921653971,0.010754970032367321,0 +piqa,acc_norm,0.6985854189336235,0.01070624824275376,0 +rte,acc,0.5306859205776173,0.03003973059219781,0 +sciq,acc,0.765,0.013414729030247126,0 +sciq,acc_norm,0.665,0.014933117490932568,0 +storycloze_2016,acc,0.6456440406199893,0.011061031791615486,0 +winogrande,acc,0.5185477505919495,0.014042813708888378,0 diff --git a/1b121b21bc4seed4/evaluation/rankeval/1b121b21bc4seed4_0.json b/1b121b21bc4seed4/evaluation/rankeval/1b121b21bc4seed4_0.json new file mode 100644 index 0000000000000000000000000000000000000000..1574d20ff08f9df37d70ddc43fa6906e01dc9260 --- /dev/null +++ b/1b121b21bc4seed4/evaluation/rankeval/1b121b21bc4seed4_0.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.334, + "acc_stderr": 0.01492201952373296 + }, + "anli_r2": { + "acc": 0.339, + "acc_stderr": 0.014976758771620344 + }, + "anli_r3": { + "acc": 0.3333333333333333, + "acc_stderr": 0.013613950010225596 + }, + "cb": { + "acc": 0.5, + "acc_stderr": 0.06741998624632421, + "f1": 0.31768388106416273 + }, + "copa": { + "acc": 0.72, + "acc_stderr": 0.04512608598542127 + }, + "hellaswag": { + "acc": 0.3577972515435172, + "acc_stderr": 0.004783723798286502, + "acc_norm": 0.4344752041426011, + "acc_norm_stderr": 0.00494674860827134 + }, + "rte": { + "acc": 0.5306859205776173, + "acc_stderr": 0.03003973059219781 + }, + "winogrande": { + "acc": 0.5185477505919495, + "acc_stderr": 0.014042813708888378 + }, + "storycloze_2016": { + "acc": 0.6456440406199893, + "acc_stderr": 0.011061031791615486 + }, + "boolq": { + "acc": 0.5152905198776758, + "acc_stderr": 0.008740964832224342 + }, + "arc_easy": { + "acc": 0.5122053872053872, + "acc_stderr": 0.010256726235129004, + "acc_norm": 0.42887205387205385, + "acc_norm_stderr": 0.010155440652900152 + }, + "arc_challenge": { + "acc": 0.21843003412969283, + "acc_stderr": 0.012074291605700978, + "acc_norm": 0.26023890784982934, + "acc_norm_stderr": 0.012821930225112563 + }, + "sciq": { + "acc": 0.765, + "acc_stderr": 0.013414729030247126, + "acc_norm": 0.665, + "acc_norm_stderr": 0.014933117490932568 + }, + "piqa": { + "acc": 0.6936887921653971, + "acc_stderr": 0.010754970032367321, + "acc_norm": 0.6985854189336235, + "acc_norm_stderr": 0.01070624824275376 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed4/evaluation/rankeval/1b121b21bc4seed4_1.csv b/1b121b21bc4seed4/evaluation/rankeval/1b121b21bc4seed4_1.csv new file mode 100644 index 0000000000000000000000000000000000000000..8a67b329e3610a5ebd9a1ab2b3b84637e55ce80e --- /dev/null +++ b/1b121b21bc4seed4/evaluation/rankeval/1b121b21bc4seed4_1.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.333,0.014910846164229871,0 +anli_r2,acc,0.34,0.014987482264363937,0 +anli_r3,acc,0.3258333333333333,0.01353542204341745,0 +arc_challenge,acc,0.22440273037542663,0.012191404938603836,0 +arc_challenge,acc_norm,0.2508532423208191,0.012668198621315433,0 +arc_easy,acc,0.5193602693602694,0.010252089491165512,0 +arc_easy,acc_norm,0.45075757575757575,0.010209906101011116,0 +boolq,acc,0.5055045871559632,0.008744525001616653,1 +cb,acc,0.5,0.06741998624632421,1 +cb,f1,0.35057471264367807,,1 +copa,acc,0.69,0.04648231987117316,0 +hellaswag,acc,0.35550687114120694,0.004776883632722616,0 +hellaswag,acc_norm,0.4334793865763792,0.004945424771611586,0 +piqa,acc,0.6974972796517954,0.010717199698083886,0 +piqa,acc_norm,0.691512513601741,0.010776164678037157,0 +rte,acc,0.5487364620938628,0.029953149241808943,0 +sciq,acc,0.792,0.012841374572096923,0 +sciq,acc_norm,0.744,0.013807775152234195,0 +storycloze_2016,acc,0.635489043292357,0.011129829820967815,0 +winogrande,acc,0.5256511444356748,0.014033980956108555,0 diff --git a/1b121b21bc4seed4/evaluation/rankeval/1b121b21bc4seed4_1.json b/1b121b21bc4seed4/evaluation/rankeval/1b121b21bc4seed4_1.json new file mode 100644 index 0000000000000000000000000000000000000000..dd4f5c329ddac8025e00643e16c20b365a7487f6 --- /dev/null +++ b/1b121b21bc4seed4/evaluation/rankeval/1b121b21bc4seed4_1.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.333, + "acc_stderr": 0.014910846164229871 + }, + "anli_r2": { + "acc": 0.34, + "acc_stderr": 0.014987482264363937 + }, + "anli_r3": { + "acc": 0.3258333333333333, + "acc_stderr": 0.01353542204341745 + }, + "cb": { + "acc": 0.5, + "acc_stderr": 0.06741998624632421, + "f1": 0.35057471264367807 + }, + "copa": { + "acc": 0.69, + "acc_stderr": 0.04648231987117316 + }, + "hellaswag": { + "acc": 0.35550687114120694, + "acc_stderr": 0.004776883632722616, + "acc_norm": 0.4334793865763792, + "acc_norm_stderr": 0.004945424771611586 + }, + "rte": { + "acc": 0.5487364620938628, + "acc_stderr": 0.029953149241808943 + }, + "winogrande": { + "acc": 0.5256511444356748, + "acc_stderr": 0.014033980956108555 + }, + "storycloze_2016": { + "acc": 0.635489043292357, + "acc_stderr": 0.011129829820967815 + }, + "boolq": { + "acc": 0.5055045871559632, + "acc_stderr": 0.008744525001616653 + }, + "arc_easy": { + "acc": 0.5193602693602694, + "acc_stderr": 0.010252089491165512, + "acc_norm": 0.45075757575757575, + "acc_norm_stderr": 0.010209906101011116 + }, + "arc_challenge": { + "acc": 0.22440273037542663, + "acc_stderr": 0.012191404938603836, + "acc_norm": 0.2508532423208191, + "acc_norm_stderr": 0.012668198621315433 + }, + "sciq": { + "acc": 0.792, + "acc_stderr": 0.012841374572096923, + "acc_norm": 0.744, + "acc_norm_stderr": 0.013807775152234195 + }, + "piqa": { + "acc": 0.6974972796517954, + "acc_stderr": 0.010717199698083886, + "acc_norm": 0.691512513601741, + "acc_norm_stderr": 0.010776164678037157 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed4/evaluation/rankeval/1b121b21bc4seed4_2.csv b/1b121b21bc4seed4/evaluation/rankeval/1b121b21bc4seed4_2.csv new file mode 100644 index 0000000000000000000000000000000000000000..2d53ca34a0746077ba21f014712bd9dd62d6595c --- /dev/null +++ b/1b121b21bc4seed4/evaluation/rankeval/1b121b21bc4seed4_2.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.331,0.014888272588203941,0 +anli_r2,acc,0.35,0.015090650341444233,0 +anli_r3,acc,0.3333333333333333,0.013613950010225601,0 +arc_challenge,acc,0.2354948805460751,0.012399451855004755,0 +arc_challenge,acc_norm,0.24914675767918087,0.012639407111926435,0 +arc_easy,acc,0.5130471380471381,0.010256289925058447,0 +arc_easy,acc_norm,0.48442760942760943,0.010254806331961892,0 +boolq,acc,0.5155963302752293,0.008740799550176545,1 +cb,acc,0.48214285714285715,0.06737697508644648,1 +cb,f1,0.3219476744186046,,1 +copa,acc,0.72,0.04512608598542128,0 +hellaswag,acc,0.35351523600876317,0.004770838678356027,0 +hellaswag,acc_norm,0.4325831507667795,0.0049442159370214015,0 +piqa,acc,0.691512513601741,0.010776164678037159,0 +piqa,acc_norm,0.6887921653971708,0.010802263878045839,0 +rte,acc,0.5451263537906137,0.029973636495415255,0 +sciq,acc,0.824,0.01204861689859752,0 +sciq,acc_norm,0.774,0.013232501619085332,0 +storycloze_2016,acc,0.6317477284874399,0.01115382325853175,0 +winogrande,acc,0.5027624309392266,0.014052271211616441,0 diff --git a/1b121b21bc4seed4/evaluation/rankeval/1b121b21bc4seed4_2.json b/1b121b21bc4seed4/evaluation/rankeval/1b121b21bc4seed4_2.json new file mode 100644 index 0000000000000000000000000000000000000000..3114f795498e9c3fb5f1e2b64f9b9e35afc26179 --- /dev/null +++ b/1b121b21bc4seed4/evaluation/rankeval/1b121b21bc4seed4_2.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.331, + "acc_stderr": 0.014888272588203941 + }, + "anli_r2": { + "acc": 0.35, + "acc_stderr": 0.015090650341444233 + }, + "anli_r3": { + "acc": 0.3333333333333333, + "acc_stderr": 0.013613950010225601 + }, + "cb": { + "acc": 0.48214285714285715, + "acc_stderr": 0.06737697508644648, + "f1": 0.3219476744186046 + }, + "copa": { + "acc": 0.72, + "acc_stderr": 0.04512608598542128 + }, + "hellaswag": { + "acc": 0.35351523600876317, + "acc_stderr": 0.004770838678356027, + "acc_norm": 0.4325831507667795, + "acc_norm_stderr": 0.0049442159370214015 + }, + "rte": { + "acc": 0.5451263537906137, + "acc_stderr": 0.029973636495415255 + }, + "winogrande": { + "acc": 0.5027624309392266, + "acc_stderr": 0.014052271211616441 + }, + "storycloze_2016": { + "acc": 0.6317477284874399, + "acc_stderr": 0.01115382325853175 + }, + "boolq": { + "acc": 0.5155963302752293, + "acc_stderr": 0.008740799550176545 + }, + "arc_easy": { + "acc": 0.5130471380471381, + "acc_stderr": 0.010256289925058447, + "acc_norm": 0.48442760942760943, + "acc_norm_stderr": 0.010254806331961892 + }, + "arc_challenge": { + "acc": 0.2354948805460751, + "acc_stderr": 0.012399451855004755, + "acc_norm": 0.24914675767918087, + "acc_norm_stderr": 0.012639407111926435 + }, + "sciq": { + "acc": 0.824, + "acc_stderr": 0.01204861689859752, + "acc_norm": 0.774, + "acc_norm_stderr": 0.013232501619085332 + }, + "piqa": { + "acc": 0.691512513601741, + "acc_stderr": 0.010776164678037159, + "acc_norm": 0.6887921653971708, + "acc_norm_stderr": 0.010802263878045839 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed4/evaluation/rankeval/1b121b21bc4seed4_3.csv b/1b121b21bc4seed4/evaluation/rankeval/1b121b21bc4seed4_3.csv new file mode 100644 index 0000000000000000000000000000000000000000..27e1d452a704c01a5a4ca45c3825db92dff79898 --- /dev/null +++ b/1b121b21bc4seed4/evaluation/rankeval/1b121b21bc4seed4_3.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.313,0.01467127282297789,0 +anli_r2,acc,0.352,0.01511040450564867,0 +anli_r3,acc,0.3475,0.013751753243291852,0 +arc_challenge,acc,0.2226962457337884,0.012158314774829931,0 +arc_challenge,acc_norm,0.24914675767918087,0.012639407111926433,0 +arc_easy,acc,0.5147306397306397,0.010255329977562094,0 +arc_easy,acc_norm,0.47685185185185186,0.010248782484554473,0 +boolq,acc,0.5232415902140672,0.008735602208318562,1 +cb,acc,0.4107142857142857,0.06633634150359541,1 +cb,f1,0.28296670272869334,,1 +copa,acc,0.73,0.044619604333847394,0 +hellaswag,acc,0.35371439952200756,0.004771447244095127,0 +hellaswag,acc_norm,0.4373630750846445,0.004950472918523318,0 +piqa,acc,0.691512513601741,0.010776164678037155,0 +piqa,acc_norm,0.6953210010881393,0.010738889044325161,0 +rte,acc,0.5234657039711191,0.03006330041190266,0 +sciq,acc,0.81,0.012411851354816322,0 +sciq,acc_norm,0.771,0.013294199326613602,0 +storycloze_2016,acc,0.632816675574559,0.011147041781368648,0 +winogrande,acc,0.5169692186266772,0.014044390401612972,0 diff --git a/1b121b21bc4seed4/evaluation/rankeval/1b121b21bc4seed4_3.json b/1b121b21bc4seed4/evaluation/rankeval/1b121b21bc4seed4_3.json new file mode 100644 index 0000000000000000000000000000000000000000..a811562054180b88e5611b8fcb1babf3e719ab75 --- /dev/null +++ b/1b121b21bc4seed4/evaluation/rankeval/1b121b21bc4seed4_3.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.313, + "acc_stderr": 0.01467127282297789 + }, + "anli_r2": { + "acc": 0.352, + "acc_stderr": 0.01511040450564867 + }, + "anli_r3": { + "acc": 0.3475, + "acc_stderr": 0.013751753243291852 + }, + "cb": { + "acc": 0.4107142857142857, + "acc_stderr": 0.06633634150359541, + "f1": 0.28296670272869334 + }, + "copa": { + "acc": 0.73, + "acc_stderr": 0.044619604333847394 + }, + "hellaswag": { + "acc": 0.35371439952200756, + "acc_stderr": 0.004771447244095127, + "acc_norm": 0.4373630750846445, + "acc_norm_stderr": 0.004950472918523318 + }, + "rte": { + "acc": 0.5234657039711191, + "acc_stderr": 0.03006330041190266 + }, + "winogrande": { + "acc": 0.5169692186266772, + "acc_stderr": 0.014044390401612972 + }, + "storycloze_2016": { + "acc": 0.632816675574559, + "acc_stderr": 0.011147041781368648 + }, + "boolq": { + "acc": 0.5232415902140672, + "acc_stderr": 0.008735602208318562 + }, + "arc_easy": { + "acc": 0.5147306397306397, + "acc_stderr": 0.010255329977562094, + "acc_norm": 0.47685185185185186, + "acc_norm_stderr": 0.010248782484554473 + }, + "arc_challenge": { + "acc": 0.2226962457337884, + "acc_stderr": 0.012158314774829931, + "acc_norm": 0.24914675767918087, + "acc_norm_stderr": 0.012639407111926433 + }, + "sciq": { + "acc": 0.81, + "acc_stderr": 0.012411851354816322, + "acc_norm": 0.771, + "acc_norm_stderr": 0.013294199326613602 + }, + "piqa": { + "acc": 0.691512513601741, + "acc_stderr": 0.010776164678037155, + "acc_norm": 0.6953210010881393, + "acc_norm_stderr": 0.010738889044325161 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed4/evaluation/rankeval/1b121b21bc4seed4_4.csv b/1b121b21bc4seed4/evaluation/rankeval/1b121b21bc4seed4_4.csv new file mode 100644 index 0000000000000000000000000000000000000000..4bf569b717e7f39c31478117a8d83eda77086bd8 --- /dev/null +++ b/1b121b21bc4seed4/evaluation/rankeval/1b121b21bc4seed4_4.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.336,0.01494414023379502,0 +anli_r2,acc,0.343,0.015019206922356953,0 +anli_r3,acc,0.33666666666666667,0.013647602942406396,0 +arc_challenge,acc,0.22184300341296928,0.012141659068147891,0 +arc_challenge,acc_norm,0.25597269624573377,0.012753013241244516,0 +arc_easy,acc,0.5180976430976431,0.010253060653479173,0 +arc_easy,acc_norm,0.4861111111111111,0.010255824507190352,0 +boolq,acc,0.5238532110091743,0.008735097860690573,1 +cb,acc,0.4642857142857143,0.0672477765493766,1 +cb,f1,0.32551989421805505,,1 +copa,acc,0.69,0.04648231987117316,0 +hellaswag,acc,0.35461063533160725,0.004774174590205139,0 +hellaswag,acc_norm,0.4304919338777136,0.004941331215598556,0 +piqa,acc,0.6866158868335147,0.010822829929195496,0 +piqa,acc_norm,0.6838955386289445,0.010848148455700448,0 +rte,acc,0.555956678700361,0.029907396333795994,0 +sciq,acc,0.82,0.012155153135511965,0 +sciq,acc_norm,0.786,0.012975838021968774,0 +storycloze_2016,acc,0.6280064136825227,0.011177095517223677,0 +winogrande,acc,0.5240726124704025,0.014036189665395127,0 diff --git a/1b121b21bc4seed4/evaluation/rankeval/1b121b21bc4seed4_4.json b/1b121b21bc4seed4/evaluation/rankeval/1b121b21bc4seed4_4.json new file mode 100644 index 0000000000000000000000000000000000000000..32e12fe0111c0e8adf341c024a24ce4721abcba4 --- /dev/null +++ b/1b121b21bc4seed4/evaluation/rankeval/1b121b21bc4seed4_4.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.336, + "acc_stderr": 0.01494414023379502 + }, + "anli_r2": { + "acc": 0.343, + "acc_stderr": 0.015019206922356953 + }, + "anli_r3": { + "acc": 0.33666666666666667, + "acc_stderr": 0.013647602942406396 + }, + "cb": { + "acc": 0.4642857142857143, + "acc_stderr": 0.0672477765493766, + "f1": 0.32551989421805505 + }, + "copa": { + "acc": 0.69, + "acc_stderr": 0.04648231987117316 + }, + "hellaswag": { + "acc": 0.35461063533160725, + "acc_stderr": 0.004774174590205139, + "acc_norm": 0.4304919338777136, + "acc_norm_stderr": 0.004941331215598556 + }, + "rte": { + "acc": 0.555956678700361, + "acc_stderr": 0.029907396333795994 + }, + "winogrande": { + "acc": 0.5240726124704025, + "acc_stderr": 0.014036189665395127 + }, + "storycloze_2016": { + "acc": 0.6280064136825227, + "acc_stderr": 0.011177095517223677 + }, + "boolq": { + "acc": 0.5238532110091743, + "acc_stderr": 0.008735097860690573 + }, + "arc_easy": { + "acc": 0.5180976430976431, + "acc_stderr": 0.010253060653479173, + "acc_norm": 0.4861111111111111, + "acc_norm_stderr": 0.010255824507190352 + }, + "arc_challenge": { + "acc": 0.22184300341296928, + "acc_stderr": 0.012141659068147891, + "acc_norm": 0.25597269624573377, + "acc_norm_stderr": 0.012753013241244516 + }, + "sciq": { + "acc": 0.82, + "acc_stderr": 0.012155153135511965, + "acc_norm": 0.786, + "acc_norm_stderr": 0.012975838021968774 + }, + "piqa": { + "acc": 0.6866158868335147, + "acc_stderr": 0.010822829929195496, + "acc_norm": 0.6838955386289445, + "acc_norm_stderr": 0.010848148455700448 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed4/evaluation/rankeval/1b121b21bc4seed4_5.csv b/1b121b21bc4seed4/evaluation/rankeval/1b121b21bc4seed4_5.csv new file mode 100644 index 0000000000000000000000000000000000000000..8a93fc9cb98fc900936685d4fe32ac71408d54ac --- /dev/null +++ b/1b121b21bc4seed4/evaluation/rankeval/1b121b21bc4seed4_5.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.348,0.01507060460376841,0 +anli_r2,acc,0.348,0.015070604603768408,0 +anli_r3,acc,0.3441666666666667,0.013720551062295755,0 +arc_challenge,acc,0.22610921501706485,0.012224202097063286,0 +arc_challenge,acc_norm,0.24488054607508533,0.012566273985131356,0 +arc_easy,acc,0.5193602693602694,0.010252089491165515,0 +arc_easy,acc_norm,0.49242424242424243,0.010258605792153323,0 +boolq,acc,0.5220183486238532,0.008736571521997074,1 +cb,acc,0.6071428571428571,0.0658538889806635,1 +cb,f1,0.4143369175627239,,1 +copa,acc,0.75,0.04351941398892446,0 +hellaswag,acc,0.35620394343756223,0.004778978031389646,0 +hellaswag,acc_norm,0.4329814777932683,0.004944755230598372,0 +piqa,acc,0.6958650707290533,0.01073349333572132,0 +piqa,acc_norm,0.6844396082698585,0.010843119201758936,0 +rte,acc,0.5342960288808665,0.030025579819366426,0 +sciq,acc,0.837,0.01168621271274684,0 +sciq,acc_norm,0.804,0.01255952792670739,0 +storycloze_2016,acc,0.6360235168359166,0.011126343044992836,0 +winogrande,acc,0.5067087608524072,0.014051220692330352,0 diff --git a/1b121b21bc4seed4/evaluation/rankeval/1b121b21bc4seed4_5.json b/1b121b21bc4seed4/evaluation/rankeval/1b121b21bc4seed4_5.json new file mode 100644 index 0000000000000000000000000000000000000000..f1a7ebd2b0c8fadbe5de0f614825d7e3a3abddda --- /dev/null +++ b/1b121b21bc4seed4/evaluation/rankeval/1b121b21bc4seed4_5.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.348, + "acc_stderr": 0.01507060460376841 + }, + "anli_r2": { + "acc": 0.348, + "acc_stderr": 0.015070604603768408 + }, + "anli_r3": { + "acc": 0.3441666666666667, + "acc_stderr": 0.013720551062295755 + }, + "cb": { + "acc": 0.6071428571428571, + "acc_stderr": 0.0658538889806635, + "f1": 0.4143369175627239 + }, + "copa": { + "acc": 0.75, + "acc_stderr": 0.04351941398892446 + }, + "hellaswag": { + "acc": 0.35620394343756223, + "acc_stderr": 0.004778978031389646, + "acc_norm": 0.4329814777932683, + "acc_norm_stderr": 0.004944755230598372 + }, + "rte": { + "acc": 0.5342960288808665, + "acc_stderr": 0.030025579819366426 + }, + "winogrande": { + "acc": 0.5067087608524072, + "acc_stderr": 0.014051220692330352 + }, + "storycloze_2016": { + "acc": 0.6360235168359166, + "acc_stderr": 0.011126343044992836 + }, + "boolq": { + "acc": 0.5220183486238532, + "acc_stderr": 0.008736571521997074 + }, + "arc_easy": { + "acc": 0.5193602693602694, + "acc_stderr": 0.010252089491165515, + "acc_norm": 0.49242424242424243, + "acc_norm_stderr": 0.010258605792153323 + }, + "arc_challenge": { + "acc": 0.22610921501706485, + "acc_stderr": 0.012224202097063286, + "acc_norm": 0.24488054607508533, + "acc_norm_stderr": 0.012566273985131356 + }, + "sciq": { + "acc": 0.837, + "acc_stderr": 0.01168621271274684, + "acc_norm": 0.804, + "acc_norm_stderr": 0.01255952792670739 + }, + "piqa": { + "acc": 0.6958650707290533, + "acc_stderr": 0.01073349333572132, + "acc_norm": 0.6844396082698585, + "acc_norm_stderr": 0.010843119201758936 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7958dfaba7be4be655fbc9efd549eb908b70a5f4 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5f7294ded12a379345619be86180687574dcae826e90e22ac23fa74b3ca9014 +size 51395415 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e1ca140b0beab2edb7e46b9cfdb7913a99aa451c --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16abe58216bd738e38850e9a78c3c3fce283be55c8dbc211f2da397dcf50c2dc +size 51395373 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2b3fc70e00cc7412c24f99f66a5e8bb988b4e586 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8574ec37c8b72024ad9651a23adb0d41441237653b86ce42aa2d69d85b720bc7 +size 51395437 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..41723477331dd640010c459f24a1fa3868f7f362 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd9c1853dcccafca9ec31894c04d971ea6433e2948ae9499cc4089befcdb522f +size 51395501 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4b82cc2d4d58037df8f63df216447586e374ffed --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e059301e32ba2202608fe1042f373872ab213136edbc22d34b21038e6ae99c1 +size 51395565 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..20feb3d0f79db6b97d255c1794f299161eef60e4 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45183590b695cb0f907906bf46d118e0b654c0408e799b92a3ec4a9283c1d9b9 +size 51395373 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ceb513f01e2060ee9e23810c992425351db40be5 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5cf634dc97fcd268b55751ee9c03df3afbc5944a935daa21d06fe0266ce1e801 +size 51395373 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..48c8f732720a11bacefad05c4b6998d18b195fc8 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bdd31925d91b009d0da6b42b0b2b2ffb568f052a6d5d1749604d441f3ffcc4e7 +size 51395437 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f32a811991e937e0b7b1957730c0e3caee17bc8d --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a22e3fa94054eb3f9d055f53caaec320643041cc2136969c3f53f4d64256aea +size 51395501 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..56000ff42af6eba1b27bd287e5878b2da95c9da4 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd583d761d6d409196058781300d102ae2c10e4dcca46c38a95d0ff3cdb8a650 +size 51395437 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..52add18dc2c012066c7d2ce8528066165d26bc79 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be3b4ca8686b1298a564af933c5df7381ede255e65912f5ad6aecb8265e48606 +size 51395501 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..215fed568dcddf70bc7f691347e8fca8566c20f6 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45c8fe494bc9257ffeb7a60aa2acea68a7d9b25c3ef7ee5f06f760dad3e0e464 +size 51395426 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..040a3010705684d3c7719a00411e295e43340bea --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:253b6834214360522ad70ae34a7a6bbbc6754c969cfe4411aed148f03e59fbd1 +size 51395373 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c88ae11b011d5d351f9a3fddd6a2e62e38d0c0cc --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88754173b4be643269fd158dd7f2c451032fb8c3ca6857c9e5f4980f0761dd87 +size 51395437 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..85e0e81416c05f361b62dad97a9a2ac98cf9e9f2 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b42e9d086ec521babab8496cf13b21d2b966b6ab100cca2f96d7f8c518993ee +size 51395501 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad6b213fc737cf0a6f9660cfad2359cecf59ab00 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ef4e0ba2f14080cf81052a2a43dc77da390a21888cc4e50eb95cf9a971c4941 +size 51395501 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee90b0451fb99350df26a41aabcf8dea7569207c --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8899f3c5b8df556c9fa4288a8886a7e698c350ea878853f30c272ed5ce512dd5 +size 51395437 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c40add4e991c4b8f2edeb23b058fea668f585f7b --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:011ee815f87c3b2f73fda7a5c7ab35f255806e91cfc0ebbf34b514ec84832e0f +size 51395437 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7a2bdbae82f9c6dcd2721e958cfe50a125f40422 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d5a89e26c399b8bc75ddff129797967e93c91ece12b9578db2d15f4f3f685e7 +size 51395373 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..00b8c44f59b0730c4abf8665eff4d0f62d784a6a --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bdc1a01c71884cd52e8b5308a6d10f5aadf5981571cc98a244b5c0a01f80b5d1 +size 51395373 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e6e02223f272242f32c4e0fc0e9fe8dfec17deb7 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f9a898ef90ef2fa098af7902b4c46b4f1373bde50fdfb3f5502ce9857056faf +size 51395437 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd84945f28cfd52c98a964ff32b273a0f4beed17 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa5ab896aee7c9b895b58be2973df6b8168d3bde852b5d625317d21f61a29548 +size 51395373 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..699d89865b18f695d9f709daee129e3ad8931dff --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5dd64158b5913237a8ec9dc3603648f5ea42edbd7a7213be9df746f02c50c04 +size 51395490 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..de85cd59cd257bb019c3a1adb1e47bbec9d8b741 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:688ff1cdd15bf4973ac64878748a326c1485f72d9ec41371be35c65f3beabed2 +size 51395437 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb138972139c51b7bf53da22cc8ed20164fb8e63 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb27f48098497de9a12e8ebade5ef40cdc93464a5039631a926f38b521a8c29e +size 51395565 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a5d8cb2ec498f696aff0f58cec5932b19c53caf0 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:764e01c6a1cddf6dc6a0d39fb2aa21d000fe5cd6dd4d960942269c20405e7af6 +size 51395437 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd095a6ea6dc2f0549b893a78ffb695cd00a4bff --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:057beda562d2d3238de2391df362e7eba8e046845bbec598b244a58033d98698 +size 51395437 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..893866f6bb9b6e61a7513cd97350da8087c727db --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5503c6476a4a6ee35395ef1060279501053edd63a6c3c82bd1048053450d5d28 +size 51395373 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef64aad0eb599a3ca794cb457877534af714ebf9 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:541df58512d4bb5cc63852bdd0fae3b7799f507fb1286525a7228850f3e8d622 +size 51395373 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4924e549d029d32e60363d1d35d26a750c3a771a --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6bbad19259886fb5d4b490c52cdd708563863b7531706365e01b1c110e9221ab +size 51395565 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bdda9c5ea99c50b7ae527fea6e0b58fe42dbcf27 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8dfbb07e463abf282eaa36eaeeb5d947a1e0a60f8fee98dec8a194c4cc4c5b55 +size 51395437 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_128_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_128_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc88f8ba9db72825383f5d2dbb7c4a80b3fd4a61 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_128_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4e5f3b402b112fa5c1d5eda3b645ad6abd545045e4a42ec220ff04cfa184752 +size 51395437 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_129_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_129_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf329cfbc31f7d69d4b9bffb6338a7ec98f68816 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_129_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:486964c1b027642baae8b6b074c10b7a7531f741900649cd900bff8d9728a1f6 +size 51395373 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aaa8dfe5fcf3921faa60dcf2a4632d58ad29103c --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a22d0c27217e7f5984e60f4294e432e6227b296390b32702f1059d3142f3c18 +size 51395426 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_130_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_130_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..721333584940f28033952ef09ee8038fbeffef8e --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_130_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:644a421ba888b292d3db054dcae151fc37baa013b8d2d309715bf35aea2f57b6 +size 51395437 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_131_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_131_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c0785e2d51d7811b64fc3e802b89307d7a4e093 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_131_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b5bd725eba03015ff3f68f61fbf57ca5f1bed0545d01414665d230d36e869c5 +size 51395565 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_132_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_132_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a3b54f113d1c52d648a481f7e35cfaa9fd2c631d --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_132_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d10a60a76f4273ba8495ece456af24c3f48356be6098d869b8f80954d8d9f56 +size 51395437 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_133_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_133_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc78eb6be33021aa0cbaba19988075c35e47040d --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_133_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07774c4ac0a7853a56173410ff239f57ac78ba278c710eb1b993d792ae181094 +size 51395437 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_134_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_134_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..77d413f6b1924ef37d4e92375f8ff414c74a9bf8 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_134_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e0fe27528282deb1bfefd113de8abc290f6d63154c9a416be061f04763449ce +size 51395437 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_135_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_135_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9ed9823f5464955103597f43f67b72d817629316 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_135_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f745e514febc0685f36bc68b5e5cca2194d6c56f9623424636c46dd32daa8735 +size 51395373 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_136_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_136_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3393161ed136a66291b595b20c501b745a4d18c9 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_136_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2140f0636af3ccc1a9fa7044fb228885f314b34bee4a0484caa1eae2e8adf78b +size 51395373 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_137_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_137_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c559c7bb3bc854a8fd1749c08f33791fefa3e68 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_137_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28244e9eee63479049770cc285de054193b5270969d0b01abdf1c9cc58b4232a +size 51395501 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_138_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_138_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5cfd786f462f24096d128a201803bef94d033af3 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_138_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de61e1d1139001ff3cecb7064cb58182c94dc3503f3cd1ec87a87158130c690a +size 51395437 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_139_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_139_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..510f91ea18a0cf2b39afb5143bc2e8312f298f77 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_139_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5b857b93e72502b5f518cc7567f726633a94c8488c646978d0ee482df098d46 +size 51395373 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..99dad7f6e4e2c3ce4cd1ad72400bcbdf4258cc76 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ce9fa2cb4ad2187a0589be211eec44d597cc79b702b331b587d3c4fe1ae4f3b +size 51395426 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_140_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_140_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..07c86371a806b85d681fb9943accc4e939964b5c --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_140_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d592fd9133635924af0d0be48437a18569f03c425f34562104b41510a05369f9 +size 51395501 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_141_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_141_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..78b8900a125d864c5b65d1b373ff17b1611b1ba1 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_141_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfe625f6f1b3b6bd82cec0c5a18faa50e06e0cafb3af83ba0b1a496245a168a2 +size 51395437 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_142_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_142_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e2b6e2e4004cf735d8603d914084495e452185bf --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_142_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a79d057b0d8512e135caeead2b2ca32ccc0df57d6692f051c37e632098b8bec +size 51395501 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_143_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_143_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2384a617efe01e8888cb1656db1e48bfe4d8103a --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_143_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9cc7692c985d768c586710a97e8373fcba7806b3f7ae7fd3c79468f7112f339 +size 51395437 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_144_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_144_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..876e384c07c39a2665b5cf41295f9c1ad1c77367 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_144_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0bf8b3f9b23ebe93a7dc39f49c1cf274d943bbbb235da6051772266545d10235 +size 51395373 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_145_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_145_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a05463f38bed0d0bf029ceda662e2b4774414d9 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_145_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b606e605937fb2f7de331e1a71edde65952925db2c947f73f6c3145d732ebd3b +size 51395437 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_146_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_146_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f1dea64284a2740dc6844e9088616d141dd27d5 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_146_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:906f0a5001cf1163a0746345d563b38ebaa9116bb03f600d93fabd99269fbd24 +size 51395437 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_147_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_147_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..902f4948495c2f440dc59fd238074d34bb96db4a --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_147_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46ffa9f19d16ce69ce2e86fe7cd958344f0af64d1ae53bbd3ac13d5e054c573d +size 51395565 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_148_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_148_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f28204a00318e8806ca72d585d8ffa625898592 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_148_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0dc8a9e08ec60bd93a16d8ec5107154f9ab78db91a684e36206d2354d6b15301 +size 51395501 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_149_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_149_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e379e44b1beb8f3e1d5e77f1af413e5857f6aa12 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_149_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a159f0090e0c4f72dc7e150aa38add0e3b02b8ff9da7e2468343b8f9d846aed +size 51395373 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..629e46d0c419a6a8c7a60f330399472603c05739 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b4f160454f93ec4a1aab8fc1aeeaf45a50dbe963d2c319d49b22a9bafa0281c +size 51395426 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_150_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_150_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..79feaf735d8f41cad1ca088c4220334205c58a3c --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_150_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2ae9934672b3046e70608a751f20442be9c7120d079902728e0b546970c42e8 +size 51395437 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_151_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_151_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f930e462cb3d2706ec945a417956728566b3e8c --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_151_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:234ddbec2cc0c3d2cae2a0688432ed98660bb79e494962fdecdf974199d1ae9d +size 51395437 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_152_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_152_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd87ca13b017274f8e9413431b88fdda2e76e34d --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_152_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c46ca4a220a5c8425ef79c6e9acc2340067b202af8e07ca636edefd072dc24c4 +size 51395437 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_153_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_153_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f683ccf5ad967d9063aca8b1e44c01fa51fe5e12 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_153_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41ea31343b8baedc93967d2fc05ea6757cf8b56436b6302e726bcf64751b19de +size 51395437 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_154_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_154_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e39ea8e2733738ac5baea76c032f16ebffe9287 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_154_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e64a922d0214435fec42413e5bcf87334d00a165740af4a4163777fdeeb23d12 +size 51395373 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_155_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_155_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0506635754e4e037e4d7307ae8bac890c0d08318 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_155_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e80a1fedcfbc47a12c9e317f1a0c6e3538ebc23d3f9859cffd2bba81009a0d7 +size 51395373 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_156_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_156_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e2cc6fca7cf7fe9c9210a6299eca17e79cdf82e --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_156_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:083227f34576d6d7129a12a9c03c147b2be96a507860c7f092c901a278ed091a +size 51395373 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_157_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_157_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa4e5401a3763cac4557006e30b4f0157a341093 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_157_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c1f55267cbd26208c73a3fd5e519f4284e138850dbf68adc79185e0da09cc1e +size 51395373 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_158_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_158_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5f11cb924d6657d94c64cd9030d5bf687e6106d5 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_158_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b08167e2802bbc942997130124b1ba561057eaa5afbcb2e43bf90b849481af1f +size 51395437 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_159_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_159_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f48f1adea3364b58fbe76561732aee8e46a17e6f --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_159_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8882916adf292cb6f92924e73f960e177bc281499f4e9df9db699d3f60396c5e +size 51395437 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f57d6590400e1d4d920f93d73b9981d4a85ef00 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47308aa170e4447381f0292a86cf3b61d24ba9b8a472e29c3fff7da076018983 +size 51395490 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_160_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_160_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e7465b57bf1160aef05d862b4768252ee2788153 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_160_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16f4eb2eb225815ac72a7903e5b6860b1fc2271fa7cce80069e1cac2b06e1037 +size 51395437 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_161_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_161_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..16097b7af6b948ce6053b9d1ac582eac9a812a42 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_161_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c250cbfd4554558938f693499a3ac22cfb032d917c6ab232999e0d6f74c0065 +size 51395501 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_162_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_162_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e90773b4a000bd301352abe461b730c78f4debaa --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_162_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9317e96a6d5447207e63432c787fe3cb7844b2df4c55d07a3ffbba0248831a74 +size 51395437 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_163_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_163_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ae591e689eca8852ee0c56781f2d143a5b89266 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_163_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b438e31f01f04330df3e1250ab2863c24c5f7ae0d33350048d830402de47113 +size 51395373 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_164_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_164_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c3098ecbf851de9af81a0aba40a692cf9de76a4b --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_164_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:654896421ac54a46f30d2c67eff560c9c65792b83cb90994aa3898cb5f456ffa +size 51395501 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_165_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_165_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1880ef641458ecbe8d5c21eade338c3e4bc0b718 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_165_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aefcbec70c68fed0c8b8cae54cda696600b2df9f04800801d2c4f1cf130fd802 +size 51395437 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_166_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_166_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c8f61b5d1c3ea4ad258fb3d8b9ba55b566c213f3 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_166_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06d47de9563d36c3c9922169c540679817ad6c6b2aab58c8eb94bd037d3c10cb +size 51395437 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_167_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_167_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e6b4f82dfeeffe63854d02b8052ae7919643f6a1 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_167_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96344edd86915ed6d56fdc19c52566a9a2236989290c89aeb22294ee285ca37f +size 51395437 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_168_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_168_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ce91bb28586c3269dfb1fe9815b763263390758 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_168_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:545c129284927e5388cf79e115e480068c3deb18637a3fd2ebc077f425ece5ec +size 51395373 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_169_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_169_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee6a117a96c31f14d532947340f3776d2d927b52 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_169_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73d610973929a3c5c28060fe662e01a4775dcc3bbb9e30c91c6cb1b7d6f234a6 +size 51395373 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b3012e2202ed3b34c9f35f554568f11d57a7004 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e032f799d86eb776f8063ddae3d50d64a4fdb83014f0d40684ae66dc65ca7f5d +size 51395362 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_170_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_170_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..de20d6c04e5ea711bad0e982ee5cc544cd4a0789 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_170_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:465ce23a0047b6900a5c06809f637f9b09bb9d34defa61934ae450fc617abb9e +size 51395501 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_171_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_171_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7092a6d0a9dc9e27450210a73dcb04bf98bb31ac --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_171_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:095a060c9b9c6275d42687c4e234afa01a6465cf32030e2317ad49448281739e +size 51395501 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_172_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_172_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ff58427656886d02c354ba3768cb28161187b288 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_172_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf2f32cfe5f8660c5cd2e50687631b07e11dceb4ee43878ed50776ff7294a8f9 +size 51395437 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_173_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_173_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b6530e990bda086c256818f3e1e479c590037795 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_173_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:011708fb3053f5d2334018f5376141fdd6fafe47c0aa108843b0490d42ec64e2 +size 51395373 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_174_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_174_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6893e9e3d49f773124557367bb99615c3f0722ab --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_174_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8acb751d6ec0e028836c959dbc75c38979f6309dc97bcaf27a30e10bbca7764 +size 51395373 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_175_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_175_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f5266ff16e0570dd1537d38c6b9516c6c2bde16e --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_175_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e66e914d2c93ddd54ac052a7a113bbd6ff929a64385abd1f7dea08f743304f2a +size 51395373 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_176_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_176_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bbefc89e45fe6aba37ff3599437a033845203a74 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_176_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:deda6637efb2cb8e4216168223eb626b4e464bcd635ca58191ed39274dca254c +size 51395501 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_177_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_177_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f0a1fef36663778b879c0e124253eab7038cfe64 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_177_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:878e7b15427f4bc36f0bfd00f1727727549487a06e10eeea3cf39cbe1537fee6 +size 51395437 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_178_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_178_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d230ed81ccf9af4deba4af7d2e93202e36e8baf --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_178_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a349321a8496d34254918a15e3cedfd2bf143fc2954f430fbee02d4640f8163d +size 51395373 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_179_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_179_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..32a39531a3232c3d08bd408a97cff620931e075a --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_179_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abe4621a58a84f9b5b4c9f2eeafd9218c34c9afdc227302da61cc32461af5730 +size 51395501 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a44d4f8b2891cd70d228e32a89507f8ec6414148 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:186469ccd7b9f5c42aa50fefdaa65edb8afdf631ae65a77c235471d508615a69 +size 51395362 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_180_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_180_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f6589892e50be6497451d80cbc1b09d30a6b49d5 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_180_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7cc8124555be7749c23a679ca301b6b47e63742b1cee7e029719259e530529c +size 51395437 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_181_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_181_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d23873cad0b25bb7492429bec1cc3b5b0656fff4 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_181_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63c9cab39e170317f4e84b88847d12fe71acdc7ad131fd4d7c4c766e83eff824 +size 51395501 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_182_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_182_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e76904bbe4087aae53b9a5707bcefe097879925f --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_182_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb7f866734fe7731bee146c6ddc7f73bcfbbebdc3e75dc15174c67b0cb6b9d8d +size 51395501 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_183_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_183_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b0855a1eeb67efc14ab075902a532220da14bcd5 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_183_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84f12aaec0e2cff5428350f6909d4fa53c0d076cc98e401d91d7d51c2058e2c8 +size 51395373 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_184_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_184_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f31043b59a055496e1851a2ecba892e85f2cf103 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_184_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:382c8573f16869f606fb0c5aa4640d7c75940c6d9318afcb4cb136474ed03a60 +size 51395373 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_185_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_185_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..071ae15dc05688fc3a2993493da77aaaa8c576df --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_185_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04fa51917fe22853d6f7e69af53ea8a02223b02067874aa6659552508853ed6f +size 51395501 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_186_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_186_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d20ebd2ae327d029d146c54df5dce3fda84fe5c7 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_186_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:481ac45045f87110c5bcc216b8a6698b9a3f9c240ebe421b0d9b1c55c67e04f2 +size 51395373 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_187_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_187_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0557350bef69bd2f196d51d120bde02508dcba4d --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_187_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d13d846f71282a20165a8e41e443436a60a15f4738148641379c37ebffc5a64 +size 51395437 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_188_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_188_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab3d15b6c4ca00ea9b0f53ade608a54df0e0170f --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_188_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41624181a4effea8a2cf6cfc54fad75a2a7f61c7fa849e8d247ab750741c8b9f +size 51395437 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_189_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_189_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6e081d5291ec66742575a9aaacf0f2985108f293 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_189_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1f2b61636f199aa8680936da9a6c0284149f013a39ef4f6acca59bcd0f27301 +size 51395437 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..00b03262c37c60cf0b23bc2868402293c5cdd37c --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:376e16915924cf1f4af70b08234fe6bb4a5b08fb738c11b799e5fd0f08a2a1bd +size 51395426 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_190_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_190_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1537cf90c48fd9c73b4b334835801a54bf485a23 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_190_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e9bad7a60ea38d92f064dd587ec689c15f1e5fc6f262e18da51f700bee755b2 +size 51395437 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_191_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_191_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..83213ee4749f2a9d7f82fd92a5ecab7a20c2ba04 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_191_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b76d23c618cda6768d2564ac9a37b77e37b0033cb34b4e85376efc4303537211 +size 51395437 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_192_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_192_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1eb301724b9e6af2568263a0dc0c1d105ac58c45 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_192_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3692804aab3ac68c31d6dc2fcfc155a2012ddb4e058d91e9a76eb251896bc52f +size 51395373 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_193_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_193_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f733c3542549618c30173712483e34afb8bedcf0 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_193_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f46c2cdbd856e1346b02b0ca4e1744501a10a3af3db73e8bd1aa0b96805e05c4 +size 51395437 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_194_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_194_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0d5de9b95faf8c33bdd6ee0fae196b3b3a5678a7 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_194_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ecb719c63bb7c67c8d54ad3c754a02b47392f592518f9b69523fe4a1252fc358 +size 51395373 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_195_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_195_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0951e88d18c9d6b43ec50aa9356b79ba01b3d827 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_195_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b9df7bd5cc0c06454e9c2b024b4680985bbc729345c6635f039cba19cb1502d +size 51395437 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_196_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_196_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a9e71af2e2ccd90005646bedb49662b8b24dbc5 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_196_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6b34d7086c1d18bfac17c915d24219e23f03d774245a506aa7caf0b19d4011c +size 51395437 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_197_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_197_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..19802caabed0f40c3d5358ee6cbfce7511503f68 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_197_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ee5ab742677ed4e22a3bfd69865cf9ac812cca2b7266e28eb3e04bee52e9651 +size 51395437 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_198_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_198_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..19f8768a1a0efdbddd4a34759583158588359d72 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_198_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ad85722a2c00a7b86a96956519dce7d30fe31f3275af61200a004e5e4e2bd52 +size 51395501 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_199_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_199_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f2557095b8cbd17bb57cbaf362d8b642e9d0c19 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_199_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5195b887510ae2b5ff04e1b0750333cfbd0c4b1813bbe9d7d94e6a408079882 +size 51395501 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..95e9e4966b64bc13a92810ab1e93d788c3b0a1ad --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7117905c3cb66f6290771666bb9db54eadfcbe0fa7e18fc162d9bc56a502b72f +size 51395490 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa9133616599fe9f33816b3a29c147ec7df22257 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:608d21476834b70263a5db22a61206ce05d999ff55b15b5ad79a2e03177fba7e +size 51395415 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_200_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_200_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2b0de5fcedf28d07b51adc6a926fbbdae6caf28b --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_200_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:edafe2b75757bf00f3eceaa6e257fb00b18d34f784e3688e1e84a778f95fc5bc +size 51395437 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_201_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_201_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..da713fb3255b641d1978ff9fb887f643619c0e72 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_201_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9a41941dd8c942acb0d79811ba7879a4de03ef93a0aa4302fb92ac1a93dadf8 +size 51395501 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_202_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_202_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..365dab9d38b3f693e607d4349c0a8fc939663ef2 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_202_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4d1f62f87b30cb1145cdbd4639f3d7448e5061ace038f80d13d3673f97aa972 +size 51395373 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_203_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_203_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..15206a5685545967e1a233cb9fbea4550ce40455 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_203_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d495fbe6b1371289c92717cd65db2e6ae80f9837d118d9efc41adfba83c5d6c8 +size 51395437 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_204_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_204_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3fc2711016e70179d941650705198894f476c82e --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_204_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7cf047b38da6fbe4d4bd2efbd172e4a4e22eb368db918140c8f66bdede046359 +size 51395437 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_205_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_205_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..48b9b3cbdfc4edea47a269b429a270b2e776442a --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_205_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60c1dc0d374046336f8e45129783c022c08182b96262bc291dd15adadb980ef8 +size 51395437 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_206_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_206_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d63e879fe24a8d54cb3af4220d23a1279be3dbf --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_206_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68752e723cc63baeeed8aef47e57e1a8f02f67d870d0d9031aeab764548d80b0 +size 51395373 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_207_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_207_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c06ee0e7c1839e3bb8b7215df3f5b0cd8558317 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_207_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bcb1db9a952eb43ebc7be52dbc96556991ef6e7c53f7651fe560bd57b16160ea +size 51395437 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_208_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_208_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ecd2b9c7d4eddfdd0d524c2e789a67d281ee185 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_208_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7bbce83b706868329636b661e8eede033c9745cf173f84dd256704ed63e388b9 +size 51395373 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_209_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_209_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6307f995b25b51936ba053fda9e942c852562fb6 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_209_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a21dae9b73975cf4e054bd498e9c9da0192c9502c7d4c89ca48fc4ecf5d89d45 +size 51395437 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e0d47952bab3f7038c292f25c73b58c7d0803922 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c31500e4d6224cc0216b824b13782a8755240701ca3c815243a0015a6d9a47d2 +size 51395426 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_210_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_210_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7629b32750bea133e91ea9a8db13ba51059fd711 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_210_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0015ab9c7d0ecc9f5d57f02d122ba8444cea9f28b6e2d09f24d86f45b713120 +size 51395565 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_211_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_211_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..81636c938f1f3a0cfa587d95000d73adb52dd60b --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_211_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:795ed60c7d7601abfe193668c4ebcccf2daa28cfdf0b1caeb18f44ddb1873f39 +size 51395501 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_212_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_212_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..15661ddc75d774092fc4f87678185d9ffff6842e --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_212_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:560cd352ea7abfec79812e342f82db13fc4e0ec641d8ec84fce6a13c8f06a9f2 +size 51395373 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_213_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_213_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8c6a417e5eec18cfce77647960bfc32b1c77418a --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_213_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3d7c615a543a36e6a5ea417ad4b9d0932f1259ba722875e60a725c77c1d1024 +size 51395373 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_214_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_214_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dcca047240cf5195705d50409a2a7b09fe320614 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_214_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6aaec9fe2eefeb01c2e72db6fedde5f01fb70706ce3faa8253dfded1ec4dab25 +size 51395437 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_215_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_215_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..95437cd697e21f7167ccc47266c7e86b546e3511 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_215_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:640e1d2152dbec60d5a5e236b281ec98ff1fd245fb5a2b82c32867bd9fa36785 +size 51395501 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_216_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_216_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb59d2c6297d3f3ffccb4b875f53696117fc3e38 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_216_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfa5bc9dc9f0538de9af54ffb8f4a87af042f089915b4c93b05a66d712b52b5e +size 51395501 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_217_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_217_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..531361558ee6339438a908408ef36036de4ab66c --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_217_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:006af985aea066634d582b1728d6202cf5cdd4229f294ee3f8292ad40a60da04 +size 51395437 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_218_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_218_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e15e9181168ddb97948e02a0c8ecbe8864aabbe3 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_218_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c46f103fef50e0d9caa06f6fa5b88bc37643321b26ea6dae311ef06db7efe2bc +size 51395373 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_219_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_219_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..85e9f109f1967f1fae617680ae7fd33fa7022a8e --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_219_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ece4e6a534764bc6b0c9d728a3ac6d9894d5cc8380bb773721d24bf534220b5 +size 51395501 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc3e2cf147bf1991a5a07545e56b9a067c0fa821 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:821e11b7d2c4ce789fd24e26de6fb81721a7296339406eb674cdbdd98eaebc7d +size 51395426 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_220_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_220_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..63e07290865f8f08e153ce7322114ff4961f30e6 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_220_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69a54260ffa1371391fb7eda80f5d7f58a088829f35c4528df607a0f5ed02f3f +size 51395437 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_221_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_221_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc8502ef29d281a61cc709704441c1b1caab2025 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_221_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:286acdf32823ec7de95fe6fefa1e9050530115411b10c3febced85924f6fc485 +size 51395437 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_222_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_222_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7db3efdf3b53e65c312dff1fdd673cd71d14aa4a --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_222_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4497c7279529d9756caccd58d4dc9d009572c2baafe16e0dbe2c5592f9483ecb +size 51395501 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_223_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_223_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2be1501caf542f272c75d5422a1e618320505ef5 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_223_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eed4f52d1edcf12d5dce1478683db7ab30df1dc39365000de8f945a72d2daa5e +size 51395373 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_224_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_224_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..38433535549e9c7fc2c8ab7707b02d9c767a710d --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_224_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:968b269d029eb34880a48170c9842497a3a2b727be1f335a778d7ebef23fd6f6 +size 51395373 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_225_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_225_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2cc7292e26fd5a105932584388cb966968a8c4a0 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_225_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c61d64d6f154babf0475f930a0ca4b21741fce6b6848345e88acd1c85c37a1c +size 51395437 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_226_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_226_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2333a87a883374d2dda7f9be45a524ed2f880e46 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_226_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7528b2ecd9b5c29cd9e5d37ded7024e2208c05f31b8b02924322ed27e38fe43 +size 51395437 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_227_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_227_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f4255e4bb43b92362a6a2e7c8b640fa547224d0 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_227_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ded696db07d2596a64b3dad95015d5a92dbf26cfe5eec0621a6d11db4c77b69a +size 51395437 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_228_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_228_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3fedbe3c08dbdfc2195a5c1f769918d459f499f4 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_228_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02600b4505f2577348f20641d013519a19dece1c38ef60445a251c9cde085c85 +size 51395437 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_229_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_229_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0b192fc7695bedccfc9d2400e4b9919916047c7b --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_229_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a756f194396f8972f27dc0254c2926098aae1c00a0f05b77785df70e547fdd8 +size 51395437 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7a3d783a85851035b5296901a69f80a5112284c6 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5c0ccfef33e4a060ba1d8dac31033fca00c2daedbc851601a84e3b694ba50dc +size 51395362 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_230_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_230_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e39f0bb19afdd89ddb5dd30cce9c32ccdd813c3 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_230_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:015321aecf39fc3ad046d4979b69dd4ca988ae95152bf01c81c826fe79082e94 +size 51395501 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_231_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_231_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..db19e9ed0a304e17750aa738e031f0288662e53e --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_231_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0619a7e4ad44fa0bbe2bf4ed5d8fe5d2b416e5c09df2b96d169b348a8103473a +size 51395501 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_232_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_232_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f56bc82dca76b15d04b50886852c3273c8eca0c4 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_232_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2dddbf72b5dec1d1f170c4ebf67aa33dffafd04b62c55e885be21d1f421be81c +size 51395373 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_233_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_233_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f7c6f42cab320f002696d438102fc253d785d5d --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_233_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3c2603806379231be8a6da2e1a2a52cf402c1b66cbece23abd9ec571cd9d1eb +size 51395437 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_234_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_234_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a1d23248eb420ae2e775212acd9daac40c852d9 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_234_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9838baae197532804193b51b2d2ee1c2bfe94f468784061f9621dabc0e587706 +size 51395437 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_235_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_235_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d0e6e1a6f5eececc86b1d2df8576560f6f00c03d --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_235_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28c36d19d96b54207b39546e1cfca04ee7660bb4173d272c8cb8fce5f289e11a +size 51395373 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_236_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_236_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0dbdf949f81c28f3751ae7fd1174f4155a1a4d00 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_236_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4ad9b9817c75d99a29bc3e4925497a32b6d814614be0b459e86ac6be77626d5 +size 51395501 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_237_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_237_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9cfe1302a5d793310dcb72a712d313c4daabc59a --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_237_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ffc4b1148c72aaba81f46a5e41ed8ff776f442aefcce51b014c684b44d3dd12 +size 51395373 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_238_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_238_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f231550c4f5caa86804458de5d8489152a6c9ecc --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_238_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9041cae0c180840ad4c2580acaffbcac2cc3f48e24f32ad47b564c35dbfc1ef7 +size 51395437 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_239_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_239_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a86f39f9922d5e94a0e3b014fc563866c2bade8 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_239_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e69e89c62c82a844a3ce293eef463b5aeec7b2d8add49e3cc64a79fab9beadb +size 51395501 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..22e2931f59ef789d09aa0b77d5a3c80f85a22b4a --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3ddcfcd35d8f2d327283fa0e7410401ae57c1e5aa72792c6a9f2591270704c0 +size 51395426 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_240_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_240_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd68ded7ea854f77dc90612d5af6e28ee813357e --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_240_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85c96c9bf0a300a66ece0825a1e326da64dbc7f8fc7debcba91ab972126f2a31 +size 51395501 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_241_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_241_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f964e84eafc9e11ff204d1b0c5e09b4df4fefe5d --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_241_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec4e7703678e772b8fce80094fda2ec2513c80fd9fd09f6073508188b9044742 +size 51395437 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_242_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_242_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5fe0c7259c2d6dd9915a97ea37bf08ec7d95f982 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_242_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75a5fdc0fa5a25702b66b371b8e9723e273924ac0655ace65f2bf24a60258b0d +size 51395373 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_243_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_243_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..99152a96aff04e2c269b9e29ecfcde9c5d862d1a --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_243_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9fc3ff3839ae626b4397f791f68f970f05a0e06f4712528fc8a8c16ce6886cb +size 51395437 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_244_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_244_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..05ceb298fa6bbf56db2e393b22928ec641ea35f0 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_244_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75d4ff393818b57eb558a4ce3d04084dfcfb3c7e90a46d5d823f331f5ca50395 +size 51395501 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_245_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_245_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..782256f2c0daeec5b56162af7d6e3e5400e852e7 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_245_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a07db1695d907dfaf31cf20c803aec3f9052139def42c2223dc4895c4f630d06 +size 51395437 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_246_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_246_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fae8c831ef5bc8987a427e18cc178504eea70685 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_246_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:699e5c4fb11d3a90ed98b78390944e1c0613829354ff68c3d1dfb1e788d18836 +size 51395437 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_247_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_247_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..51bedfd7f65eae4939d8a20efdf51413b7403b3f --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_247_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f6b1dfe9b45ed422598bc82e9a6b8d0501a1b4bf9ec8d9d81066fee34f942ad +size 51395373 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_248_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_248_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..767db2b74e90aac6c9243ebc31041a95fa1817ba --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_248_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41c75864926f4cd5d306be33edd19876924abb755ac8352f8677d41c7d56b201 +size 51395501 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_249_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_249_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..afe9bdce8aa5b6190f1c952c2b07f854b8ade15f --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_249_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:049ae3dfaaafef5c1a39fadc7fcacb64662f6980ff4dba70c05cdd27b68eb730 +size 51395565 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..42bf0ffc0aae8fc53ed1dfeb0ea10061a256d9f8 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6d07f642b3649cb931c0e8dff96657a2db3f8db80a180d9c11b86e0ece20847 +size 51395490 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_250_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_250_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..02629322b7e29df08136485246acdfa372090ccd --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_250_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0fd1172d0c7c9d0724afbbb5f400561653f057e91222a7598f191012a1aadc9 +size 51395501 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_251_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_251_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..061c172218877ec09223eb060da76445531c9479 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_251_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ade56e15807aaab7f6d686a365583e623ba9c21762e8d4e6591913b7e0655044 +size 51395373 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_252_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_252_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0db22235e39c43307723264ba09a80363e1db86f --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_252_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a9d39d2c914049a7bbc6834a31214aa33aa1d56670b34a3e1499f8903906182 +size 51395373 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_253_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_253_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..441409b5f85e1f0e2f2288d6b6e9fd99248d4092 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_253_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2eb8c026edbb491cb83ea044beb570ba61f362e7c2ae221e296110238fc9752b +size 51395373 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_254_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_254_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f8a6b050aa3af437b2077ca90e5848471de49ad2 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_254_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:545c75dcb6a4dc2db8ff901bf68c3d5b591b628c31042d7979edb2869bc8bd35 +size 51395373 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_255_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_255_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..982bfc074ed5c7e7fc0664c47ed0ea4a3d371987 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_255_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3757ee6288f818f70bcb8694200093d2133f12113025119f5212798b6877b92 +size 51395373 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..69848bd294305c81d39b18d2e758b2753ffc8a27 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27bdafd9bad33b0347c8d88467a3605883ed62d63f75f8024ebfc58f4b4008e3 +size 51395490 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f273d2aa2413bb238a158bafc65019c6e8582b0a --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3d40c0ab25f2228279e01f03af950dbd8f5f80f9e72b42f4ad7de02797cc08c +size 51395362 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a6dc91b884dd594bd25926cc6cc9b491f3f31e0 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e539a6cbc65c8417265560c235e11493a42c613862fe752373345d7f79f5be5 +size 51395362 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fdb00b12fe3d9395f3c56bbb12592ea087559c33 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ffc1da4773236f8b789ce05164189c49dab21984eb2e5c7f83ddaa968921179 +size 51395426 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..32796c38e75fdb2bcd9f5991c731b43728db9b7e --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96e143098fa72eb49bcc4beca85a7ea8d8d7fc9dc7f3470f0d3e6457d9d22b9f +size 51395426 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad4289bb02b0b98cf7c0d14015c35eab6ff2e36d --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94e10697bcfc1bf2e04306de2bf4564abae68fed0720395e51ae6c305230b581 +size 51395351 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8712b1878ece7bc77cd01c03d01f8a4ee4431700 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f18549375b069cf8785589363c269ff483d8aaa2948a8fe090a3494a39ff4c23 +size 51395554 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f511abb28dde5474aee5035e9c800d897e72b368 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8dcde418d2f70a94e02337f0f126b85174b5cbb3930034d1e9162d32b4554197 +size 51395362 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..05b563fb79189f10449750fd81f6300d6cb97b76 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3d7e67b0678f4cddd9553afd17e9762c934fcf580290211cd6d769c0d0ea078 +size 51395362 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..663c3195f8b1b712e80942b1242938fd1a8a05d4 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd3e5171f0b42c8911c66ece503e88306b6bf6401fbce999e127a7d2a91e4cc8 +size 51395490 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ed05577137418b18172c8a8ed04d3fc81ec606c --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b4e7b3a1808dc4e89cc88dc64f67ada053cebfabf8a00b55e40b6f46b787b95 +size 51395426 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b64bd2e43a4e6355f332a71641b23541d4c1e244 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d2334dc3e5570e4cf5cb66c13b0dbc61049eb3db6fd17f16f291b6d5f577af5 +size 51395426 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb4e3840440891e404fc3b9aa5809df992ff9ac8 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:140d70074e116ecc36ed48f3865c685666c825ab697ad7603c259bbe1d03bc8f +size 51395362 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c9a2ce9a9eaf7d790b237f8829776e3968dab3f3 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6d41437ea2afcbcd41c6aee1482f069d5d22f6b0d54f428b6c11e47c5039289 +size 51395362 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..38a7f097083d0af5887d359787cded311461810e --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a0b60c6a2cb3fb7ba20a1ae1a7ace5be088ee611f4ee26b24992a192a216b81 +size 51395490 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5edba1fc767d90c219170c2f38967ef639b0ef00 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1319923e232a06a6c24e1f7862554ee4a5b7af773345f03c2f6a9ab3fe428c33 +size 51395554 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b312353696a4e23d88150eecff99517bc52982d8 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e19038462183833bf7d82978dcf7e99529e11274f4daa42021487cb58b5afad +size 51395415 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3fe4404c22bb9fe20666ab619a707f216182b359 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11c369ef01db1d0a2520147d487b197930970fae0f3a0d0ff8f6e87e01ac2208 +size 51395426 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b2676279b79ea35035e5c30f91a563204b80c5cf --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e1609c576f9d23d91c4c50f579a7b4f4b3e73d5b98bab87da75d3ea5eec0c51 +size 51395426 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ae3d09753b7a60235f6a05e7fe107216b786ce9 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d69dcc2def652b50000577d97c1fadcef9424c3e30fea09d325f3a98a7978a2 +size 51395426 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a638a4aba6f4343c21b8f9bcac2203a9c05a3181 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:034fa22451be1eae4a00d750b8a074c8dbfd2c055dc5d316819dace9e166decb +size 51395426 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..44ef3a0f3d5f010eea7a5c134ae668174f6b2777 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d964293d19ce93e12373ab24d381a37f4253a204c0c80da854010b02a8d681d +size 51395490 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..568785ac254fd05fc5824bbdcbafe686e75126b8 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4cf53a9bb11fe1687b1ebe3e87bde99a1930021a874e20f6b21dc56568267051 +size 51395490 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7f7de9acabede7213122a3067bb27c38f7398b6 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38cfec2ffde07e8bd04ae2318625f95a3137cbe4b64f6576b806cc7dd9f191f9 +size 51395426 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1083f5f80e427ca7eff0ac6b6e10596f57e51157 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:987afbede2aad8401364ebd2f3422809567ecd566a723e9bbdec4c6525b6d019 +size 51395362 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a6d09a5b26577f584b3a00c5a200bd928120dbe0 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f553e352b67eaa298e820149c1cc3f5d42561e6ed54f4588828ee71681f9b94e +size 51395426 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b68bd68b53a8ba5e20ff6e80908d7c6c296a43dd --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2f8f2de761c529dcfa49fd14f2cb80f23b91e49b30eaa26cef332bb950c77cc +size 51395490 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..14dab3d98d205fc29edb52dadc976d1313ef4e72 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17e42c5b665e76b3393337816c7acbe68e69a9963baedf129d1001594480ddd7 +size 51395415 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..036e8877f01b3c24678c52f5efdb178114a473f2 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25ab282228674a61a41940b0a6e4685ec623978ed6a0dd5c7fdd6ae1cc743f42 +size 51395426 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b2833473cbd2a9d272bea461ea0e180f01c3bdc --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3a5981d244eb02e1a4a9f2ccb4cf1e97629c5dd4eb4e561d0c73b2189a50632 +size 51395426 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..127dfd72db78fd702ba07c38f04a3fdb9b345e81 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97d42694149b02be836d373431a22393649c8868ac93b9ea224cf6db395f1a75 +size 51395490 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec0f0a0933f1ee12955b3122e280e07930c3af9c --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57ea79a2628b82031f6454c18514f0c4f80003fea7138794c652c8421b95ec5e +size 51395426 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fdd7fd7ebef821b12873a99d32daffc26dc81b12 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:164a1c60ff90cb970e9fbf2232fd17738247ee5d3ae37d5c88493bf1b05834ae +size 51395426 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b6f38dd8c7520853030ad8c32c253098a6fd12b1 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0258f12064970c1c2571e14d2e34cc2382b5e894bbb7079c352f01423a7ef0c +size 51395362 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c3555853aea7528280e056843508fd977c09add --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7957e294193603e3f768f98709c80c5c34c8148909208a526e22e75d62623d91 +size 51395362 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..515305e38df32dbd2415a2c6a4587d387b486247 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccfe9bc2ca83b454e15f95c0d846951be7878a3968a8f58db13ccc98d07388cf +size 51395426 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b52c02e96a7789a596a1fb55bbec8643f5b0bcbc --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25ba0b4338da8d7d4dd748558b3b8fb973f8429f5b509d7cce06a1a946050cec +size 51395490 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1c5169ba17e1bc7f97ad15d1a27ef1f122f1de2 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa2200eea8ecc0eefd98fb05b0c6607d1116c9ea501be3fc50a74cfe6212f042 +size 51395426 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c43723e5f95d25c84ce20fdc9b36970a52a1505 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1c107a63c1c971f7622aa41bbd688d5d21b7b42131f047fc99a2dd6f2588808 +size 51395415 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0035684024b93db9a5086b27231650156a791054 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4213065fad6b1322b3760da000cc32aa90519fb1bfbc141a2874d65de0c26922 +size 51395426 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c67583989b09e1b52a6b6104d28fbef5b1e1269 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d41178e8e3b8a67cb016677017e8b010eb9369d75601e837454025fc00af6d5 +size 51395362 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..714b797e2f081a0d8ace945c17edd1f0eb0480c1 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:782404ae2040b0f82e14bc09af23af13438619e01f613576f7f7b260ffbe78a0 +size 51395490 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b3f924963f97a52f5a299d62c791c16826e7e7d --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:643de967f61b01cdd69218737082b3597d1ca9d1df1a5a37d38b080a1764ea9a +size 51395490 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..411ab3c34d3be8cc9aaf6b903c04b2acd8f4ac60 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:482ba37de59d5074a0189005eadd0cafdfd1e4ea8539effaea51866b704ae646 +size 51395426 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce864466b73ffe49aebf9bd6f30ea3df9b9968b5 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a1814c89529945bc7c181ef436504cf77710725abd0d56ad0f62b8a718737c8 +size 51395362 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bb04a0b8574b0cd9bb87fdaed5961176ff5875d6 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0763e0e20442270e9788603c5b8a9edb9b726e7ca19b5fea2712b9d8a22c76f +size 51395362 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..928a857897ffee45bc37638b1b90d2e0423a5779 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be8593373d1bbcc260f8bb1d0f4bfeecbdb579f02843014c2ab1189a19795fcf +size 51395426 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cfa55dba7fb3524e0a767659c7e4dcc56a416bdb --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1849874b15db2e2a1ec588a9738c9d5825920d7c13e2a799a48c21296ad8033e +size 51395490 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b29af1732242503d21e224647f105822d517c38 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c88bbd24c958b0b3d36f3ce1c916f58c4650e3c1c6ef96ab82128935a3870e10 +size 51395426 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..73946a498e0ee0db60c18b5a1dd21e8bb95a1102 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:303e702af40679369442fb3bebe544910571eb288d224821003b05d0329f7d84 +size 51395479 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..972a4fd498184605b294f6592dedb94f2724c25b --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed84604bb0b22ee1e7210e83cf17a92da95b651ee5a7838982d71d9223d8e1dd +size 51395490 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6573463d29782ac7d9e8f93cb653f4acfbb897f2 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2caa35d1b4b14c08240bea95c43400a22373b44f8975954ba8d5df16610f0a1b +size 51395362 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab9e29cae3f3f9c9de460ea2f8fad592c2e96a31 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53d3b9b2a638fa19b1c42fd6a258c06f757ce945c4caa872eb181f0967135b86 +size 51395426 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..820dc58718f12d11f02be840a6978a4dd605648c --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f0334c3ba0e57cfeb8a6653a0d87801542e71e275fa5758566a4e665b090068 +size 51395490 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c36628630b8bdff0fc0c4ea2f9ad5825274a9c8a --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2394d899948536f72c2d032594185ac678d21d54c4afe2267e0da83f10bba8c3 +size 51395426 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..209598abafa6054f2e3f4f7361e61b266c73ac38 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dad796c678a706fbaa45a3a027ddda2e5ac502694ab7e583e74170692a3afaa8 +size 51395426 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e79ff28868259f14c96513d18541f2abe14f18a3 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e34927a54ad2b2ace2fd8c3b7b43b725abff513c0d21a8f9bc15994941423142 +size 51395426 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2504b926c5917e0b3c3413376e5ced76fe538805 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c90a269795147585e5eb690f89c2cb86a1d2225072991f0879e37272f6956621 +size 51395426 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..259f7e91c16af346e4ca2ccb4b37fae1e156399b --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01efc9fe55672da3029442bd92b3127eafbeaaf6dc5a9e50a3fea2abf9765f55 +size 51395426 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cfcf6d234f1f39e3f5e90a10ed99881e7da26657 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:103211fb3213f2ef5ccec956330435e1ac5f40376ab54bdd11b961ecbe0cd9db +size 51395554 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6611c462cd07c3a29890c0428813e8a99bc96cc2 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9cefc2cdec2cf01ee781308edd8ff9e1cb69edf55f32febc04345f813420d9b5 +size 51395351 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e2e87722702ed23d2ea3b468d4910d07ea44aac --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04fe818306ed909aebb6871342a38a83e7963fe0ee820388ef0248a83adcecc9 +size 51395426 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..37cb4b434d09e67b26a090793a0ee54c7c77bc7b --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0142f5e83ca73bdf6af66393af8a7cf3c47d486833fb7651e443cbf8e09a78b +size 51395362 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3de514225d7838b2231bbc76e13f6dbfd23b1ba4 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc7a7b5c3da2a1ea3c2e70c51a07e8901d51b1e71c3a199fbe125b306627b07d +size 51395490 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b626952bcbc54c65f239c274ae5fc64cfbc7ecb --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18ef89390743b676696856ecdc44d813c3fff003c4807d33f34fc97321eadc04 +size 51395490 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e180501254e58d5ac9e3943daed644e90efd88b4 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ffcd0c6fc793b217403a4bc0c2ee650cef36af93ba252f8300825fa7f018223 +size 51395426 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e37be15cdfbe13ee89df58ce5a9dd0f1a45b3ff2 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:634ee9f67be6790361c21666217d37e859dcfdd4d69b9b23aa032ea71b8fe773 +size 51395362 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a2d32418140539a52a3e571bc8a736d990bcb2be --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33aaa414e8b3ffef66a669efde150dadba2397dbfc06ec6a357a0251f09e4322 +size 51395426 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ad750244b05c3ba0e79460dafbe08f0486b81a8 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7cf03c942251facacd89d96d16503b8dfb24883d85b2926accd655531eac795a +size 51395426 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9099d8951650b306d2a037627bb12865f71e8395 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20232de91a743a32b2a60c9c3c4fcbacd78c90eb0d5bb6677eb183c24c3a3ff1 +size 51395426 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d348a9f40759a242bbc3457828a88af20860014f --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2381d1f974de357edd3212aa4a3a75a0949ff31b34075052df5f33481d6b521e +size 51395490 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c5df5e7e55b577ef9dc6ac8655571c428732e2c --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c601b3b04be55f7e2a238765814884be8b4b8335dc77b154099cd23bf3f0d33 +size 51395351 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4757626e40a29ad601b370481a44ce5cf4bf92ce --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1af628c78695f67b51d785102292c8db9f2b8f731e6925384d01b702224d27ea +size 51395362 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..13a9037c7b62727ff97494b8a99e61f5e413cda2 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:391596a3c43ad5bd5b7954c33d61c72e1b3864b00bdc641d983b24d5636ebf34 +size 51395426 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c361efe1493b5323c46c00c07d7b44c2af59720 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f664a23cf4c8196a1101842986baefc6202c4834e6918fdab2678012c2f8e558 +size 51395490 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..309f4cd0196fa79665babf2b0b79c2d1b49408f3 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51e04739352813ecf25c908e7525cf0a29daab87d1ab1aa68c1e07c5ab2ce8d0 +size 51395426 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a278380776879f0af20aa792ecc5c0a55f652fe --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d026795ea6768f168ede8f14da58b98cb5a624ace90fef4dcd99625dfd2fac84 +size 51395426 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec7ac2438134a03de366908f384916b68b76825a --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83a044ab6213e1e48136037c47dbde64384601472a62a485e02875f57029d2ba +size 51395362 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a1fd894ef8d0d0da92437f03115a6ceeff27256 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce63a31ef33b89c1465abd1b8a24d0b1cf326d6d3a945232284469ad70e9f222 +size 51395426 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..985d08c779f3ce0e49277348a1cd1864d7c7b73e --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c58291e8545d1fc39f98f3d10d1f9db3c25f77ebf14aed03f56aa1529901e5c +size 51395490 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3cbe0ae858c09222ac923e8f6f78d509c9700b98 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29151328ee0307dd2209cbf55bdf7d59e4b1a295f612e75dfbfe2502cc91bbeb +size 51395362 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e76766385d09d290571d50b0d2bc96a6d0989cd7 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12c6fd12366eebcf5c20c1763fb993a62c1f4f7cd834c81d5d30fe5d67e848ac +size 51395426 diff --git a/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8bca83d6b5412718091f7e65c45b2417ced071b0 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05e1ec5dadd9826fff717ba52ebe659ddd20bc441e00e05872335273341af49e +size 51395479 diff --git a/1b121b21bc4seed4/global_step39672/layer_01-model_00-model_states.pt b/1b121b21bc4seed4/global_step39672/layer_01-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1db157a23ee2966aad46aff33d71b5a1311b2b74 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/layer_01-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8daf68ebdeb577b4317309907a78dbab206164c01ea5f3b221467c969a0ee60b +size 187630851 diff --git a/1b121b21bc4seed4/global_step39672/layer_03-model_00-model_states.pt b/1b121b21bc4seed4/global_step39672/layer_03-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c78280c813f415f34bb32ec1323ed7d66d558a0 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/layer_03-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:388127386fa52961717726d1f3b4ddd61364fbfd35847f4e15d601486aac9156 +size 77121283 diff --git a/1b121b21bc4seed4/global_step39672/layer_04-model_00-model_states.pt b/1b121b21bc4seed4/global_step39672/layer_04-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..04fc7a112e641d57bde4073a84e247f37546ea6a --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/layer_04-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:847fdf2b76fefda31e5c88721cb2699bfeaa18711a9e72fa6b3e729c13d3222e +size 77121283 diff --git a/1b121b21bc4seed4/global_step39672/layer_05-model_00-model_states.pt b/1b121b21bc4seed4/global_step39672/layer_05-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee5d4f95593809db2a92972478b3e3c0f9db3a76 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/layer_05-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c5f6451034a0490f6a33b16b8833533f74af7bff0aa02d6f24bed4dba181dae +size 77121283 diff --git a/1b121b21bc4seed4/global_step39672/layer_06-model_00-model_states.pt b/1b121b21bc4seed4/global_step39672/layer_06-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a9b04321a09ed4571bcc8b78c1836c9601a2af1e --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/layer_06-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:048b2d437d1f335f3ef4c271659444d32cf74349bebddd85b285597144cc6a94 +size 77121283 diff --git a/1b121b21bc4seed4/global_step39672/layer_07-model_00-model_states.pt b/1b121b21bc4seed4/global_step39672/layer_07-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..972c3ed00d028b1ee35c94f889380a7306e65cb4 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/layer_07-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05b02cacb528c752f2b52d62c7f461d613846192de0e92c841b21d26403429cb +size 77121283 diff --git a/1b121b21bc4seed4/global_step39672/layer_08-model_00-model_states.pt b/1b121b21bc4seed4/global_step39672/layer_08-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d7fcbe68bbcffc6a736fe8b78901489c388137c --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/layer_08-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8c93ca3f1673591470a736e4c2f9465a749ec756b348af1577e472def61f759 +size 77121283 diff --git a/1b121b21bc4seed4/global_step39672/layer_09-model_00-model_states.pt b/1b121b21bc4seed4/global_step39672/layer_09-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9dc996392343a73e1edabbe4c18de7db9408f1f0 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/layer_09-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74c6e15b582e93d48a8b4ac80b53cfd851da579cdbe3556e04cdea395a8813da +size 77121283 diff --git a/1b121b21bc4seed4/global_step39672/layer_10-model_00-model_states.pt b/1b121b21bc4seed4/global_step39672/layer_10-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..05e008d89acef56373b31b52bae57c6f74615622 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/layer_10-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd553aff5c89cb91c7df59935acb7d6d499f8ef8189e37bd38de6d8a8a8d8e36 +size 77121283 diff --git a/1b121b21bc4seed4/global_step39672/layer_11-model_00-model_states.pt b/1b121b21bc4seed4/global_step39672/layer_11-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..da8ff88f2706a2cf4d12c9fad4e320b824483bf5 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/layer_11-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b4621f756e9e5e98d6e2b8448742297bf6c4004a56d95ef6f28ead8bbb043b5 +size 77121283 diff --git a/1b121b21bc4seed4/global_step39672/layer_12-model_00-model_states.pt b/1b121b21bc4seed4/global_step39672/layer_12-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..12f68ce63437cfc1ffa4200321469ea7450f448a --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/layer_12-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f2e79a0d42d31b2bcb8cd479aa6c89391317c73735a2b2fddca6812cf6be1f4 +size 77121283 diff --git a/1b121b21bc4seed4/global_step39672/layer_13-model_00-model_states.pt b/1b121b21bc4seed4/global_step39672/layer_13-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..798e4ffda9e5cc69048779f453e7534ea09b9dad --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/layer_13-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc60c8013bd4bbfe7c9a42c6465943c789d0c28094157503dd88653eb52fd9d0 +size 77121283 diff --git a/1b121b21bc4seed4/global_step39672/layer_14-model_00-model_states.pt b/1b121b21bc4seed4/global_step39672/layer_14-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e7fce568da8a484667c938312104a3f750193474 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/layer_14-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c730335ae99909bd444acd5ab6a5fa072565fc2321c335c8116c4509f4353e6 +size 77121283 diff --git a/1b121b21bc4seed4/global_step39672/layer_15-model_00-model_states.pt b/1b121b21bc4seed4/global_step39672/layer_15-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b9757da456653a420aca196c55ddb37a51e957a9 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/layer_15-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81829aea504d75d9900dd1b61e514ae67d4d17d6368bde8bf8f2607397092086 +size 77121283 diff --git a/1b121b21bc4seed4/global_step39672/layer_16-model_00-model_states.pt b/1b121b21bc4seed4/global_step39672/layer_16-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..96478b11007f17f6f2386aa9d161920f44dff215 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/layer_16-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:415c8150b7283e660941e7612b115b3cc1960da79878a2f4adeadd82c1ba5572 +size 77121283 diff --git a/1b121b21bc4seed4/global_step39672/layer_17-model_00-model_states.pt b/1b121b21bc4seed4/global_step39672/layer_17-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..29fbb5db81c32af57f1003921c61bdea33dc0f2d --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/layer_17-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:daae8743aa170e00653930debeb75fb6a0e4b62540196f9c22148b06526d6b20 +size 77121283 diff --git a/1b121b21bc4seed4/global_step39672/layer_18-model_00-model_states.pt b/1b121b21bc4seed4/global_step39672/layer_18-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a670f6cc0ad4857a4e82e4b2952a534ffcd5f581 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/layer_18-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce1c943acaf3981ece079532a1eba826ffcdaf1ccd0f072208bdb64946c94594 +size 77121283 diff --git a/1b121b21bc4seed4/global_step39672/layer_19-model_00-model_states.pt b/1b121b21bc4seed4/global_step39672/layer_19-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ec4670c662674f92f3caa6ef4120909dcb696e2 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/layer_19-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2cffd7e2d29210145941439a2d53a6a5454f74a61fca58224c377fe85ca5600d +size 77121283 diff --git a/1b121b21bc4seed4/global_step39672/layer_20-model_00-model_states.pt b/1b121b21bc4seed4/global_step39672/layer_20-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..91fd95186c716c5e33d7b857427bac48771332b7 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/layer_20-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:920e6f01f6481614ece33cdb24dafc0200918a263ac067a2bf6904cb9afb115e +size 77121283 diff --git a/1b121b21bc4seed4/global_step39672/layer_21-model_00-model_states.pt b/1b121b21bc4seed4/global_step39672/layer_21-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ddacc9fa6db83cb726f370d542d7719a1177e09 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/layer_21-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:efd54f851f2f12de8fade05c3f432231088483ebbe4f4203e8cf6ed88b24ba87 +size 77121283 diff --git a/1b121b21bc4seed4/global_step39672/layer_22-model_00-model_states.pt b/1b121b21bc4seed4/global_step39672/layer_22-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..03ba45e5b8a11bc17c43bab5cc41c2579290fe3b --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/layer_22-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c339fa670460bdd5e3e0196ab890cac82ea7435a3db000f733595ee7bc62bc99 +size 77121283 diff --git a/1b121b21bc4seed4/global_step39672/layer_23-model_00-model_states.pt b/1b121b21bc4seed4/global_step39672/layer_23-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..83dacdd17f5f5e429764b7be29eace43dcfd824f --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/layer_23-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2b9875e97dd4c1f020917ec0ca52e44e30424ee0d6aa6a8d08d86a1f35876d4 +size 77121283 diff --git a/1b121b21bc4seed4/global_step39672/layer_24-model_00-model_states.pt b/1b121b21bc4seed4/global_step39672/layer_24-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1337e95c5cff4b29a3a78fdcab048cf4b61b4762 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/layer_24-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93520bf0f3c6c877e7a3718d28407dace54a08216ce28fa0a73362f44ac4b1e9 +size 77121283 diff --git a/1b121b21bc4seed4/global_step39672/layer_25-model_00-model_states.pt b/1b121b21bc4seed4/global_step39672/layer_25-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d5686f1a0fa710be65143e76d26f844dc97d4a15 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/layer_25-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62cc6c5c8e2f9a542dab684ad067807b2d99044596e3ffe71776deb148a7d427 +size 77121283 diff --git a/1b121b21bc4seed4/global_step39672/layer_26-model_00-model_states.pt b/1b121b21bc4seed4/global_step39672/layer_26-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f83968b6a7934ec29a7ff60f8c22718b07062ccc --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/layer_26-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f68c4096f445e35b99d3bf45cce2cb12b6eeac18cb48af229834d73facaaf023 +size 77121283 diff --git a/1b121b21bc4seed4/global_step39672/layer_27-model_00-model_states.pt b/1b121b21bc4seed4/global_step39672/layer_27-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6282c18b0a7516f1bf29e22d855928d7b4f14caa --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/layer_27-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eef0e35d2345c23e64b9df05038ef13dd37fdc681160245f997d688606b9ba14 +size 77121283 diff --git a/1b121b21bc4seed4/global_step39672/layer_28-model_00-model_states.pt b/1b121b21bc4seed4/global_step39672/layer_28-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0b3fef71627ecba32321f951453008dae6c517e1 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/layer_28-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ed7f5eba9c971028a5ac926ea65bbdc44585cc6fcb548cce71693397a5b5ce5 +size 77121283 diff --git a/1b121b21bc4seed4/global_step39672/layer_30-model_00-model_states.pt b/1b121b21bc4seed4/global_step39672/layer_30-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ff211dfd750644fe542953afde37af0adbc25662 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/layer_30-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3459f1702500f2743add31b5f05fb55f146bafce3f1b656d27f90eca5823d7e7 +size 8387 diff --git a/1b121b21bc4seed4/global_step39672/mp_rank_00_model_states.pt b/1b121b21bc4seed4/global_step39672/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f64a205dbe34a2209cfda7883b7b8fc6a2a37e62 --- /dev/null +++ b/1b121b21bc4seed4/global_step39672/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ed8e9c5b3cb45806fe8d214971a43eba878545c8218be92b80214cecaca7e8b +size 43827 diff --git a/1b121b21bc4seed4/transformers/config.json b/1b121b21bc4seed4/transformers/config.json new file mode 100644 index 0000000000000000000000000000000000000000..7120acb75187622c061f0425674b658dd9155502 --- /dev/null +++ b/1b121b21bc4seed4/transformers/config.json @@ -0,0 +1 @@ +{"vocab_size": 50304, "n_positions": 2048, "n_embd": 1792, "n_layer": 26, "n_head": 14, "n_inner": 7168, "activation_function": "gelu", "resid_pdrop": 0.1, "embd_pdrop": 0.1, "attn_pdrop": 0.1, "layer_norm_epsilon": 1e-05, "initializer_range": 0.02, "summary_type": "cls_index", "summary_use_proj": true, "summary_activation": null, "summary_first_dropout": 0.1, "summary_proj_to_labels": true, "scale_attn_weights": true, "use_cache": true, "scale_attn_by_inverse_layer_idx": false, "reorder_and_upcast_attn": false, "bos_token_id": 50256, "eos_token_id": 50256, "return_dict": true, "output_hidden_states": false, "output_attentions": false, "torchscript": false, "torch_dtype": null, "use_bfloat16": false, "tf_legacy_loss": false, "pruned_heads": {}, "tie_word_embeddings": true, "is_encoder_decoder": false, "is_decoder": false, "cross_attention_hidden_size": null, "add_cross_attention": false, "tie_encoder_decoder": false, "max_length": 20, "min_length": 0, "do_sample": false, "early_stopping": false, "num_beams": 1, "num_beam_groups": 1, "diversity_penalty": 0.0, "temperature": 1.0, "top_k": 50, "top_p": 1.0, "typical_p": 1.0, "repetition_penalty": 1.0, "length_penalty": 1.0, "no_repeat_ngram_size": 0, "encoder_no_repeat_ngram_size": 0, "bad_words_ids": null, "num_return_sequences": 1, "chunk_size_feed_forward": 0, "output_scores": false, "return_dict_in_generate": false, "forced_bos_token_id": null, "forced_eos_token_id": null, "remove_invalid_values": false, "exponential_decay_length_penalty": null, "suppress_tokens": null, "begin_suppress_tokens": null, "architectures": ["GPT2LMHeadModel"], "finetuning_task": null, "id2label": {"0": "LABEL_0", "1": "LABEL_1"}, "label2id": {"LABEL_0": 0, "LABEL_1": 1}, "tokenizer_class": null, "prefix": null, "pad_token_id": null, "sep_token_id": null, "decoder_start_token_id": null, "task_specific_params": null, "problem_type": null, "_name_or_path": "", "transformers_version": "4.25.0.dev0", "n_ctx": 1024, "gradient_checkpointing": false, "model_type": "gpt2"} \ No newline at end of file diff --git a/1b121b21bc4seed4/transformers/pytorch_model.bin b/1b121b21bc4seed4/transformers/pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..6a988dbf9ceb8d254e85f0763987ecc9f8b85479 --- /dev/null +++ b/1b121b21bc4seed4/transformers/pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e9849705bee618659cb9b0c5cb84c66611abb121a0a922baa3c6d1eb2f1fac4 +size 2410895501 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e8d4aca551f30b0154031970361e90ecfbbec0a0 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:165edd01e3cfcb80885a785204b444c8d45ce8053216f100216fc54f7f02a1e2 +size 51395415 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a8740d2e6ed3eb8424553d60912219e9ac72a84 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a50711cd5a0b39c510bfdc4846bc7f2fa24d3506b32911a22249dc45382a008f +size 51395373 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d989cda83a47f4fdd8de9f1e2b36831914e1af0 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9cb77a1515df0ca2c339d490a20a9cdbb9242cdae7b0b7dcf71279654b2bb315 +size 51395437 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..109369044cc7c281939dd02aa4f3d856a9568aea --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e66f2fb4fb80bdc4ac1f9c53a90d8adc73cf346db53b8c7ae6367c3092911485 +size 51395501 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1fa8be1029a6dadcda9d1fa84666b5fd5c446cf2 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3445aa3d5486592f9d673b4f0b4e950ce793956cc4ab6c4bae57aad0db7c3261 +size 51395565 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f1ecaff12f90727d53350c37337e9327cb113f5 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4fa0d06d738c73e364effc5f1abca428d2e17ea54674b932410b53b9d8463e2b +size 51395373 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f01745714ffff69067b3711f29ce6074b51ed5f --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c38d0bc8935a7c3d1b3852b5a69d92288fc1d7aa4b8c4afde95ad145dcb447b7 +size 51395373 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3d598dba0a2a18c151afb36626b6ba8dcf8e7452 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf8782e970698845fbdd02b864a4f78244867f09dfac5ba5d9b740340d9ace8b +size 51395437 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e01285317574f390658e0ddabf036407f2078c39 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ec07b86e3ecd571498d32609865bc67507066e9f68f0cb1c774d5e1dd7c1c85 +size 51395501 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e4ac7b6e10e76818d9cc0974765573a954187a5a --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88da7fca5b51559b70be88f2ef7ad297d389bf74b4f70d662fe19083f894efe9 +size 51395437 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d0566d6cc1757831bf87fb0d87321cf022f3bd72 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c393d2c54d83d9414664b645205de7014cb2840423e7c29dbd4e87a4308a8774 +size 51395501 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..242eef0fabfa1f9a3cc3aaa4d5d3cd5be59d7174 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a97d49898a3daff88e8f99ed728fbc154a1dc7c87cf38a453648b9edde4f5c26 +size 51395426 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec2f6a931ec4b07a490699a47ff7c6b4c4d1c0cd --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e30843d5d4fbbc8530e9cf6f1412a7aaae3435c0c467eb1a62332ac12d1f6cd5 +size 51395373 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..14505b55daafb75dd1a533b097cd69326562bc43 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a4092e48ad945b8d72e1f2fe5015d525f578be64bf98399aeb798fa114e3973 +size 51395437 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b97288be69fe8034deefdc6898353dece170560c --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2fdc05dcd8d843754a055c191e2f64d10db6762e755cc5c24056c8e078bb8eae +size 51395501 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ed45e81e231b7e2a15046449648024d6c6ad30c --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6df00006421ee94d4665471b31b69cca22f8cb8d333b515642741676bcba07db +size 51395501 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dfbbd6523d399d553822a616547acbb32238a2ea --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f10b0fd76cc1ba80f5cfef50b7c6bdf948205f4275318c2daf3cf113db191476 +size 51395437 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5f480848b782fd21988e80d527540ee848987e0e --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:654d7e1fe07fca9d207bf643d8dd6f6e215c4719f5da7bbb88afd42a37f66b81 +size 51395437 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0931f1e08bf101637ce5b6c7f2f760278619eec --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:015a02190d5dbef37ec7b0e8ac1afe8e02624f21fe21d0096631162f131a8a67 +size 51395373 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..81272213489e1fb96b6ff3ee699c1a9040f05a35 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5d65c200a9052af6d057ace631c3aa518f22ff0e325b8d0da73bf46ec2044a8 +size 51395373 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a56acffdc0d05fdfe1785a79029389a22d38e084 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ca4ac45a95f5b0d6ea6faccc804fd4b05f5c187c0b07d0db5e8ca459f9d3b76 +size 51395437 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe5dfea302661ee835fea02c3f6138bcc71d5a1e --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42f07ecf0927a82f31b605cf79f95f1deaf3e0117359da589f862e97859cf06b +size 51395373 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b6b14bd7a726d9a84be79c1c8be76af6b39ab04 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42c18c26fb2589fe4601d86b82d39ebebe59778c80f249bb3284af574bbe4cef +size 51395490 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d34c0e65e6202292b4ced946bdac66db41b3041 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6d979beec3e9828fbce934cf58b24a3f2ff75623a15293cd98b643b393eb977 +size 51395437 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fbc75703cbd3b37645a33622451cb931a28f6b6f --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8060f01fec81148e29b610dbd96c31ac76edcfc28e2142f43154b4b190edae17 +size 51395565 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3029fcfc9add2923dd903c3c153d25ffae9b533c --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf85f633a88fd72ec419bcb44011cf34f9faa944e76adefa508aa7892b646ea4 +size 51395437 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c1a3cd5e6e8b3efb0059d7c06ce2740bc4c57b9f --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9481e26f3e16cb7307c6ebeeb26afa18a37cbabf79a4262c33e8e015923b45d1 +size 51395437 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4178cc36e712531eb8bfa52b185c50f27c77a6fc --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d57444cccd69a5395f0a0e7cb8ee22bd4acc33cad01fe392c62df934066194e9 +size 51395373 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b667d025cd9be202b3458d3f94927992ef4b6d84 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:728114cc391c6396af793ca85fabffad44d062f924dbe997179c817d2127a92c +size 51395373 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d1dc2f1ea9b646e12b4a5eedf7a6520890dcbda --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e02a5cdd7287d3b7595488a01e9a5b7958d25e31eed3aa4ba5efb8b409612cd1 +size 51395565 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d2aa3a6dad00b181eaddf57342742712488cce13 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a95e4810c149b30baa79f82dea0d6fb37218c6905712b96ea6a9584a892505c3 +size 51395437 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_128_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_128_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1524f9e41426ad9e5c194ca8022b23697c09faf1 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_128_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b44a34590363dd998033fba807be58942a90eb9421f159683fa671d6640a91d5 +size 51395437 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_129_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_129_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6e1f8343b375356567dba1a6404170d404e3039d --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_129_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5e4d333b4dd4b58b5549fba9022437150ac23cd73f1e4512c395b7d3de4c6d4 +size 51395373 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..58d567d2cdc18ee253c032f039faff74181ab052 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3940ec57372a1334664d0489b942771c994dcfdf6f63c94676417588a1e24bb +size 51395426 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_130_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_130_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f6c6cb0e548a737267b22bb6b46779edcb3118d2 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_130_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3bf23e915201638356f20765e5b0e126c433d624ed5ae065575a4f7642213e3d +size 51395437 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_131_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_131_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..482a8ebc53d7a3409d3ad43c1819e9721ae8888a --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_131_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:709d15cef632d55e44602bea25e18ba027d2e03b77371cb780c4b206d87ada37 +size 51395565 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_132_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_132_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c169ae5503cc0b91fdc43dadd2984c8a07d1a0a8 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_132_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e30795eadc2ea35d753ebb5578f57c23b8db68167cea2555a59d2cb04bf34a3d +size 51395437 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_133_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_133_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e869fe8db23030b19d0ba0e25e2f4ac44ca3cc28 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_133_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe005b52164a33f94356721b7bb261c7154216e2b499877db7694014eedf4bf3 +size 51395437 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_134_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_134_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..763f529a086ef0a02ecb1117692b4f49e4b49efe --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_134_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a64e9416e55f287e6726090e5039aa4c3a9f0b19bd28e730761811344027b3ee +size 51395437 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_135_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_135_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c8caf408d19672fc18036e78b6d7666567181a1a --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_135_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35982f925fd02db4d53063cf0871c63b7a7501a823b3fa4e0f4699f10b10756a +size 51395373 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_136_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_136_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..633746fcd4c2d15812f4d89541fa4745c57aba8e --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_136_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dc18a204ca9775873fc8317cba26e44509cc0148a9128030c601dc9625b06e78 +size 51395373 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_137_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_137_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b60e886874f0761b9c56f7372c58d5c3e2fb271 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_137_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24ab305115122b9c0a2319081012ba67efa752db5f5f596b733bc89909690daa +size 51395501 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_138_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_138_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b760c1e0af70e7d1d2a3aa27b0245f1a12685a3 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_138_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c90bf40c605cafc39ff0307b783b856ac2d7852e032aa28e49db3e8457b4380 +size 51395437 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_139_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_139_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a5438b81b8d3196129eb6f7281ca498497d4d825 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_139_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eef1fd57ee1597317c40f6f1de7841c89e6b4390a5946b939033103573e38782 +size 51395373 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..350ad25ca750edeb18fc34ed27b3ae5ade75ec90 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c72b0d018ece8801fdac4daf5bafe70778e5c39c5159a91630f3ec23a119715 +size 51395426 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_140_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_140_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..78c81fd40d4c84b75e7b600baee0c86a286d0a24 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_140_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4069df89615f96b86f05b14cb0bb7eadf6ff37f6b20ebec2ca2435ff5f1de333 +size 51395501 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_141_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_141_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1575dd635a3ae15b38fd68148d123d285faa6657 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_141_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca3e541f865792e25e9e7c1964c47a3764bc2524a1adce44e9a0cf34a22163de +size 51395437 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_142_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_142_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..15d5c12c48a1ba890f918ee13265d4dac4579ca3 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_142_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4e68df0c45bc6c67b09eb45cedbf8b9fef3b1792ff4c2dffc10fc2f6d3c624e +size 51395501 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_143_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_143_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b5c6aeffb01c192a96e5b4af86dced50fb5c9508 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_143_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e81923da77d5e9ec6e09a27edac66d306a34bf231a12703e34f4141f7b2548ae +size 51395437 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_144_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_144_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..356b14dfd42f21d1b2c5d47d5cc2e0b1c398c49a --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_144_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51cbc592585968b9895f693da00fb6d5ccd325d4d6b7946274d200ad28bc885e +size 51395373 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_145_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_145_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c61c3cd09e13ef740df9f06c8a1715846e21f83c --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_145_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d42b4124640fc1338c85beb64add9dbd8bd1befad45dfc790508df355943550c +size 51395437 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_146_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_146_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..af16d4004937ce6cf858cf2668255d4eb2ab5d4d --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_146_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a3f172afdd70ad61d04b70f1e7a9d140de6d294db649d3b9955e48e5762656e +size 51395437 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_147_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_147_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb8f2066f392446cceffbf7054919dd68f734e1d --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_147_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f9bb14dc79463314b51cc7ef7b4df94babc47eb3824701213f3f47d2f05a769 +size 51395565 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_148_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_148_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cac37f08a891ca04c2e875e982d0de0a16e5192f --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_148_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6c666f32bc8998648e27e3e88b63dfce71db7f6e7dbf9c1f79738b08d1db7e9 +size 51395501 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_149_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_149_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..368debcb06dbc71d9005a2156a061051c32630d5 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_149_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8657aa5bc0b84d821cf14292ee16d05beae589015b38a6de95616cfce1d05cdc +size 51395373 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4963891f3fbc3608ab56a507b803f97674e13962 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07aa9dd14484ccdd78c727fda93a06bd9f2a6215d01fe1095c7889c48dbfd110 +size 51395426 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_150_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_150_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bfbba93de4ba7205d1170c9a6b49b71373f389c6 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_150_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a64a033e11d3b7ab092b1d954035bbbe19b783d7143c91ca9f73519fac4241f8 +size 51395437 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_151_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_151_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0915894eaffb353e26b84aa998be233e7aa69043 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_151_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8fd31428533c352b5f6cd874e61a3eeb1af8dedb6c61de568de669b70fa8ef7 +size 51395437 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_152_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_152_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..771bcb9a7d16277ac78a380fb83889063f95d6fd --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_152_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb3943909e0a2f3dfd93e5397526b7fcdc3aedeb5d85d887adb7545c4a909095 +size 51395437 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_153_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_153_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ac4b49e0916b275466cc1e5d87f8b2684045ae86 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_153_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9e561403e2f57ed16d960864c496eb803f953f99c4fc2446896257c5d29f9e0 +size 51395437 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_154_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_154_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..62f170b494a311cdd1ddda3de105d0916e50c7e0 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_154_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8321849216199bdd3acc7e4408d2c4578a2159a9d881a889316fa1b0d56dbd68 +size 51395373 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_155_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_155_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c29dc008f4b15b6d4a206da594f08caa5e77f45a --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_155_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:167036cd1d3456d3e5decc8bb6ddaff2195348571d85ddc420567d05a626479a +size 51395373 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_156_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_156_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b031cf1a8de7857537c6b516ce1727161311e7a3 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_156_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d189f643fcf71c1af871907f2aeb9b2deecad22aeb4cb03f1c2f7a7ae15d571 +size 51395373 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_157_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_157_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d7d85b78a3343d5f5cab0f8e3c189711cf4a6403 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_157_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5eb5c240dbfbb72bb3217d7cb53591ec46a951c622c44894e37da923c2ae88d0 +size 51395373 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_158_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_158_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd2f3994c3ef2f2ec512d7b85336d539b8748f8f --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_158_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bba3caedd74f8575fa3bdd538e99cac4ed0f1c9695fbf2b8473f9a3304da857a +size 51395437 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_159_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_159_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb2ca19bb47d5306f8ee5f052833209d1324fe8d --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_159_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab3531564c1a816de4c2464935e89c53f3d63132c0e5ca10261413be13049322 +size 51395437 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f7739468370764704a2c0556185eee168836039 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:492949d808b555e7a99528a3a1e61dcfa4a0858fbad260c6fffb73e2c2c37839 +size 51395490 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_160_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_160_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc52be4de7ea4c9149c7afd9a2e8ac0b3f1c2a1b --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_160_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f6a6717008fcb2f47911f2b6d2ef1b83e9c03361349c69e8bbb2b526674899f +size 51395437 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_161_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_161_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6f7f23c5413c24c5fe78bc7eeb1d7122f37c491 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_161_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2cf5d46bac99073bef7384eec3c6d2caf4127ac3dd135233040faf5de80f8513 +size 51395501 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_162_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_162_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed5ac28463190068534dc205dd8369a7ad3b4b40 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_162_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66e7ba3cdc7c41d2aa099f4c631131b929ee0d4de31a004f0d881b1c24a246fd +size 51395437 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_163_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_163_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f020fd1642dd8abc61c2279e757492f96c8f5cc --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_163_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25db131a438c8cb41b458a716c8e148385f9c21825f27725a8543a5b5e44412f +size 51395373 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_164_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_164_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..596d16e26087910285820653c65bb1dc3643121f --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_164_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72735b19ad8a3894dd96f664eeaa1b74e4dad3dfe95232bd460f9384de9892be +size 51395501 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_165_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_165_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7cead802d6720e092ede31d1e2093c2c50fc26b9 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_165_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a184a9f355913702adc79d9b39ec8076258624bdd11c62c96c62f6915e75bf0a +size 51395437 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_166_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_166_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d2a216aa028dff0747722b970a817316b7266752 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_166_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:529447a043f2d588f227aafb5175b5dd70a13e5b8c28099adc9ee21eff2650f0 +size 51395437 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_167_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_167_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..24ffd94b8003d94adc05686907a672ebce0907fc --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_167_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f47006259a27be31cda18cbf04f6dcfc9314d93037e87788b1bc79dc1aeb52b +size 51395437 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_168_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_168_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb358f1524266df4bfaf3d17bb0caabec5ff0c8c --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_168_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7fb9051bb43313dcdebd4915d930a48317f404fee66104d9d9494470001a0fa8 +size 51395373 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_169_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_169_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d0b27d6bbd5a0d811ea787d14162e454d1671f7a --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_169_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c38323a4d78ddc6b53e3aea4950041311ea8fb729993d6e2876724ed7ce26a5 +size 51395373 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..14a91e3a5e8aaa34b1733a04e0fd37d9e4af94fd --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85c45d396db674ff2d84a8172116ee325842f985e1cd697ee706a3f903dc4694 +size 51395362 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_170_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_170_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..862ebb8ce421df12f842bf8232f5426c08e80d29 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_170_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e189acd83f8ba6df9791447cb9a1eecd55996336a33f2f8485ddb53ecd446068 +size 51395501 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_171_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_171_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8acf480f904af5accb3e7fd0f0aad1c67b1f2c62 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_171_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32e4fc051f136fe6356f42e4dfd464d6a8902e985c114b7caa534d5a8e37f903 +size 51395501 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_172_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_172_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..31f0baed953bdc81d7d6b934414b3a8b5fef3970 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_172_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:948ef7e1c95f961f8613f30310e4886319af163124f781b9b334b435df0e2b7a +size 51395437 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_173_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_173_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..82037254637e518922d52c9a7f9d91cb16e0a41a --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_173_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9a1948c843070fa8c3c2c88eb826bf7909318e3a81d01390bd722556fa3c76b +size 51395373 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_174_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_174_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b20aaef480b897d66ff2523d0f8a8d0502b76146 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_174_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:872b92e02b36459af0ffc6f176d954f39b3cdece9ef181ab792a4e97acb7cc74 +size 51395373 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_175_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_175_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d0b173b0686b2f46eba29710bf160a0006cacc4 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_175_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a56d775c5ef88508cd356f6adf5d2d0f09f4b1853196fe2a90a92c645ffe9d3 +size 51395373 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_176_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_176_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad8eeddca6c1b7b977f386b62bfb2b2a1b81c434 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_176_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b41acefb4dd91a12351a029d0d3ee31433d2330b68ad7c0b9564e0db1220f4ca +size 51395501 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_177_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_177_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..95e4cbad242db173be5aa203830ff2d545e4d699 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_177_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3445ab87f368a3b01aff6abc6d227dcc61ad9b91041a6d064249c67c5ace05ac +size 51395437 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_178_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_178_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2cefb8f426fa286739b86bd4d4e0554f946b460d --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_178_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86d58b0ed573c2775cace151892f1d6e49f1120e0d905791dab0cd444513b242 +size 51395373 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_179_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_179_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b84ea14a421a09aa3ffd5bd8c31d9119038c473 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_179_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af5fc1da391f49e2a9fdf64971007da91b27df6189a8e7f54ae1ba0b590d8d8b +size 51395501 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..30f6b5630faae137a56866e56f04fa76cf215248 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f045f3c9507bd0d66a62891ece9a410ad0e928bdad395fcfe5323afa9dfed03 +size 51395362 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_180_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_180_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d14c478d70a1ae5376c4862e88286bf5ea4a8921 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_180_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c887fd950ed12f3591090ee59875488d88a0b558f6e15eca7272358230943256 +size 51395437 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_181_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_181_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dfca64773f2dcd71adc96ba3453b5bca17c2cb0b --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_181_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d0e36d1c24fb29814cf54b406ee6b6703edcd7d390d88c227532786088abb25 +size 51395501 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_182_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_182_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa53782bffdf6eb016da84088b8c574893926eb9 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_182_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02c42e0791374d8eb21fc88cc9a1595be79b8de9f37835ca1c75ba78ea2e28b3 +size 51395501 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_183_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_183_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7962c5c0e100160b4d3981a2f52e4ac163d55884 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_183_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1aff3cfb26834595c00e0e390e7eb770ae70f2a5b6badae4dadd1f8a82ac4df8 +size 51395373 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_184_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_184_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..20d40f075af225339609839b2d0d60ed856a0106 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_184_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8f067afe4b05b12c81461e509156daaff80b96ab4640294a44836b0fe131ce7 +size 51395373 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_185_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_185_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f09026417c0dc79510aa6a8fb834fc0cd45e120 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_185_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40b608f956a1343c1878e82bb169e01451078fde35a3df210c6a6f4fb68fd600 +size 51395501 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_186_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_186_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b6e90106527ab25b222174d1e9501057d37b6dce --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_186_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb3de36934f852499a638b9a03583822fd8c1dacc2f00e961b590f4cebaf8b14 +size 51395373 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_187_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_187_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ff5e8c772d8c32d3298e475020c5ea0f3984f071 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_187_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2056460b4429e90ffa5dabd713f882d0d46b866f95df62ba9925c79ad5c5843f +size 51395437 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_188_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_188_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e3a08ebb1ee7d9ff883ef7d179cbc95d3bb42cd --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_188_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb08df78e9cf0f88507cc6aef9ef68cf4c2243143e466c016a58a6713698405e +size 51395437 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_189_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_189_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d31a81f2e644b1c36d6d9d0a503a97969c21ac29 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_189_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:766f9fca697b5837332d3db8327ff8b86526bcd38c208e85f3d51a0988d502ec +size 51395437 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc5548668f78542e9f9a2757512cc8353156f57d --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb43777c2080ef43f39bbe4d5d10ee948d2527c599d9329af701ab43c1e7387d +size 51395426 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_190_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_190_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca307fd4081173a89195e8555b55b33de8ab5782 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_190_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bbe4420fe4e265460f086c9f4810e44c5b53da03d437a9026cb0de7ebfa2d6b6 +size 51395437 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_191_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_191_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f19a574d84c6a097ae6501deff37d4d75e4a112 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_191_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d18fa7d779c74146c01005c54f5552734c89567a9556b777c033fa57892d6117 +size 51395437 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_192_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_192_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..502c5a3ec340129f48d933c19d23cbc7bd840ef5 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_192_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7bed88e02b192b52a8ef7403db6d29e7bd14f37798ac3ff35d8c30e210b3f0cd +size 51395373 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_193_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_193_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..86df5a3270b94fee513552115543ff6ec26fb166 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_193_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c753f682e05cbe6253e1b87c69e79f5ad5b23a0365a24fb031375010b83cd63 +size 51395437 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_194_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_194_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..367b68a3244eeb9595aa8acaa4e2657523042d81 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_194_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc0898668155e7fbb0249afe00ac92c95b7c7aa78dbbbb32991f49182de28a72 +size 51395373 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_195_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_195_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d28b4df80c354791e96a53776e9ae9795d97a26f --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_195_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a700532a1dd0a04563fb1215ae4218191aab5fa3b1405cfda0da2b9ba3fa4e1c +size 51395437 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_196_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_196_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..48285bc7b3e4713ca7c27fbaf7432ee3ee6404f0 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_196_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8bd21825bd7d464e796dc35058aee01697cd9a336886983b89df2b1cfddbcb97 +size 51395437 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_197_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_197_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d83d740657ea8bd54dae70fd5b001544f64daa85 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_197_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:066f1dc1368401650a89b62af1caf605845c13fdd61cb9c2ee1b4f69e22b8205 +size 51395437 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_198_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_198_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..84c43e1c82afacaa89e2105352957c35c74d8d51 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_198_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac64cd04ad76c03d039fe818eac8e8074c9a585dc0efd6ee4d9803904d71e63c +size 51395501 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_199_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_199_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ac14db254e9931db8864beedc66efb74d0f22220 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_199_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6bac9bd1d770510dd60d4f82acb75a724070d003d67ca1af8057eb3f170a797b +size 51395501 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..63864f48c6e1af3c6e665c468f69ac6c55248e7a --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2f7287dbdec813bfab8fb204a630e42d7f6d7343f2e3f25b759631eab0ef9c5 +size 51395490 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..59e55747933b594805461e28fa35aea9b3c37963 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41eecddf032243064a9fbe2e89c41da4aafc31fd9a92a45e29b2ca89181c7638 +size 51395415 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_200_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_200_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dfdd57b826484442fca65064b8aa91cceb31f878 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_200_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2caba57f2f9dc4ca59a4ac20b887d2859fc5e256401e499b9d0a06702870816e +size 51395437 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_201_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_201_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8cd241c1b0c810e53b088c184c58f77e9110d8a7 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_201_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9134650848e7f2e98a9f9e45a7eeae00b3d66065e6cbe523676ec8fbde06ea9 +size 51395501 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_202_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_202_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d440494273d8f3b966fb769c2988e8dcc30df0e5 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_202_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0c2630d44aa7aa375776a4353343277d6f25800b15c2dfa78a637be2df688e5 +size 51395373 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_203_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_203_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0225d764d9d593daec1d6905618caffe7b55959d --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_203_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ede73f5d0fb8cfdadf14cb9b7c1c303ee26a7d2ce0667f83119b9bd361274688 +size 51395437 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_204_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_204_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c4280909cd62afe03e2e723035b8638362d885ee --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_204_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29d09e4ae07b7bfd0b64227ebb6c67e6ef9af54088c1b3b0ec66e7514fe277cc +size 51395437 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_205_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_205_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..43e91c5fa22cd6bfce16c1e18c0e248193361122 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_205_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4afc4be273f5e6aa8968cec4933a8c26922b3b2c5cea923893c9f12cf8a4120 +size 51395437 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_206_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_206_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..86624b3f8e848457b0b321d52432b68cc139312d --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_206_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:694ed874e140893bafa272f4aa39f8edecdb4ac1b58fc66bdd1f54e8522f475b +size 51395373 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_207_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_207_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eea2d8898457cb4a12e415f51b5293b301e95e65 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_207_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2cb3cb303b7f158104fef61ed5ad773bd4362c2fce46542b5c5fc7722e64f246 +size 51395437 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_208_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_208_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..83649061727cf0de8bbe54273ea98f23ec4b58b1 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_208_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:093d544fbd673cbaa5956b6b39b2921404c9a30664474bcb68c9249d8869ff54 +size 51395373 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_209_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_209_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f9cd4bfea462465ede45822f2cfcfbb24935b6ab --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_209_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d09d6b3846df370ff7020b4e959f7ed4a341f6086e1326bb2f66fedd463ad2e9 +size 51395437 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..89c38d30ab2af11ef03f1e2c669a0fa243978535 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:251bdf577289634794400e569c3abf185f94d967b65025f34b34aea155867711 +size 51395426 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_210_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_210_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd8a9df8d04f019c5d79902945be04d41f2f8cb2 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_210_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9772a392a239147dc4f025c1e88745ee559d4ade13204c94326d1b37cc6cce77 +size 51395565 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_211_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_211_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b097308d106d93cf3e554813ea8a6bde11bf86a --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_211_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a469cb2214692ae82914a49a147b6ccf8e56bccd00d161db02de9243af3397c3 +size 51395501 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_212_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_212_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..473f9e1826df7e09721a1f23f7b9744878676fcb --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_212_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:028de16615eed1b7e8382fab6a12cc7e733c0d0a0b8feecab4326ece2457435f +size 51395373 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_213_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_213_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a6811c60838664994c4c9ffb47b90c39d223e30 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_213_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5118788c6a9e804e38e1165d7ae5ab3f9fd6371310c6dbff5d3d594404fe1126 +size 51395373 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_214_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_214_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dea0fc52fe332ed66d0629c7467aee1f4e28be05 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_214_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34ee28bbcc00f2729c73630792a73c7cc1d84b03ca38763255c412ae61701729 +size 51395437 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_215_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_215_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..47cbd10aa50e0f6f21af203cdc0a6417579f942c --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_215_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f84e41c4c30f26ad26f10a424962e66a4a28940b872a6d3283bf221ea9d0d41 +size 51395501 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_216_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_216_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5bc23f5ecae9f67ff34b25c774d7bc1fc43d3113 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_216_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1484bb812811e76a06c6337a6a7eb149ab32694dfcb6ad58ee2f3040fea20fed +size 51395501 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_217_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_217_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d66387b6f18f1dcf7e17890593e372e7ba0f0d6 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_217_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd4a0b4dda7f9a0744d781bb05878979284b02f1a0228024539c48fe89f458eb +size 51395437 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_218_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_218_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a791453d4d3859834da6787b95a7952938dc8949 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_218_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e27adc544eca6c2cb3d6116ce13479809dc823c3066751168efe9b116defbed5 +size 51395373 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_219_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_219_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f985df8f633105d13b14f425b270ef9d1767327e --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_219_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccbf0a8a1acc8e89ad08066af8a84590d8d42ce2c3febfc03b6e5156eea01961 +size 51395501 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f090448c27534dc18021ee3b47f0faf41fd90b16 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d5b93283534b2b54d87d9636ed87be1993f3d7554dd954028960b7993f25257 +size 51395426 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_220_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_220_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fbdbd44e409cf85cfb18404eb401b9b0f67edb3e --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_220_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fae6bacf4fbba9b6b43024325e70480b4943651d1e53f3b5f85b25acd624c01b +size 51395437 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_221_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_221_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..593210430ece1ce43ae158ef140b33273509dc1a --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_221_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc94f880e1cc5a1c9e918510d0942ba296e1eb6802fc4d9ffa220ad9e150d7eb +size 51395437 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_222_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_222_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..03508f0dadb73f1e0253a70279458d54ee1c113b --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_222_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d34745d20d5e238424a24cb8a67cb8ecd71a87f4b1dde50eb78794230d56d3a1 +size 51395501 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_223_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_223_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..28d37121c842e6dc4a32b1a62807f16cecc8ec47 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_223_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad8e256c7654ff2b8d0260648c517c59f887d8d81f95a8c66a56a29f026329af +size 51395373 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_224_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_224_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d8a5f4a742b3694bdada3fb833be3e6d7d6f2c47 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_224_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7b818fb9c2d5edf7461bf9cb2787640ff95cbfc6c497668e3ae0d79cbd5861a +size 51395373 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_225_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_225_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6634909a12e5dd954dbf251cadf32ab314696ae1 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_225_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:253d969ffeb897fd36bedc0d4c0574ac6988fe6d9f94543db5ac111f2c741ed9 +size 51395437 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_226_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_226_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a8ad469b1ea601d9351684cc6050aac8f41a9a0c --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_226_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0aecbe5c26d55ef57e97309c4dab476f4e2b265e384916ad38778d38f5d387ae +size 51395437 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_227_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_227_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca8089a0b6b4557a8d3838a6891992d48f0866ae --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_227_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa840c06ce2950c37c486be4daecc4b28765eeba744e64a550b5bc732031091e +size 51395437 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_228_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_228_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8bb1475fe945ba79a02112100ede048ffc4c70fc --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_228_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e9e37781cdb6e27cdf635c51faae5d4f2e482fe14fae1c5984f18c1e83229b5 +size 51395437 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_229_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_229_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..71cdd4dd6aefd82070cb13f238a0b7299feeab9a --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_229_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f329dc699f8d6f5c6725bf7f8703444bdc12d7c3d28bc5ae15227cef7c37ea7 +size 51395437 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b8e81b503c0f627fcf4e1f49d8e4a1b3b5433f91 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c28f63d8a47dbbe775b3b208486fe22656a33cf777b8a6a1b860bc2bba87de25 +size 51395362 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_230_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_230_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cdda55a97b61d0ca5f28786cf32023c5f49c4165 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_230_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5cb7f752af4b925f84f3082f341bb411060152596385d2116d09249cfdd60c2e +size 51395501 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_231_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_231_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..67f502499e2022a91b0e5bb05071749617675cba --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_231_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a447043d98995175dd925aa397fa974a38d17a9eec209d87bb3388972ff18d0 +size 51395501 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_232_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_232_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e7b6a98767a96555b3aa6c93c0388a45f079f729 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_232_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e72121356990e61fb4fd0b5c8b79ae1b36cdfdaf195b756bfd55e3b4072ad972 +size 51395373 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_233_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_233_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c9ac09bc6cc2022c537c05401b557bcacb40a693 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_233_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c072bd081f6e809aa7358c49f19a1a33c55abfc29f86d01ce773ca2d00a505f1 +size 51395437 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_234_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_234_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6bcf72f05d8f6d0c881737d2ceef23edb0cd11a5 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_234_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1c18e8b9fa674adc0bcd07a3fd2422964c6d17567af5d5f61f08d9329211bc2 +size 51395437 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_235_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_235_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0450bd54461cf99e6582a6c19d82f34ebe4c554c --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_235_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d01635f16e5d29dbe54530eaea88710143c7d3f1a799ecc8bb8d3944e9da6f7d +size 51395373 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_236_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_236_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ad7d8eebbf2f24f68b59af8d662d40dadfdca75 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_236_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2118b52f642ada3af6e1489d22c79e8072f3e8b42cefe65c5316cdd58e5ac3c +size 51395501 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_237_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_237_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..14086931d897ea586b980cac5664311daa525aa7 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_237_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72eb460dd370e4ff740f2b809542ed3b01531aaf1e285e0dcff63e323c71a664 +size 51395373 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_238_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_238_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b1f9662b36d709fb3776bde31df9ab1a1d5f5346 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_238_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f581d8d16cdd6b72c4de4cd3f59455e062f150f741297e115f849b76dcbed6d6 +size 51395437 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_239_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_239_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e29c2bd4231c10a84664e1d0a359a1f083b2731 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_239_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4094d678c6a1963f2198e44db0a47f5289552ab0b25e68f6cbe6f2e14c395151 +size 51395501 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e7ac876e9fcc7e9580f0a4a4cbfe981b09837bb9 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8ef0fd409dc010385e4aa498d1d718da1775bf4b2ae709d00541003e8f4f938 +size 51395426 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_240_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_240_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..77d3548f8e19c8e0a7028bda96e6409d3bea6c0f --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_240_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:adc6f5180f7e376280b02e52454967153e0dbb802e03557ac7a693d434bf8d04 +size 51395501 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_241_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_241_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7fd7c642376b04769fffbfa6aa0599ebca5dae56 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_241_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99fb935e19b82e46c23bde5749fdff6e5045da49c85153b8c53575ddbd8a7bc2 +size 51395437 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_242_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_242_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..47b325e313e820f57460727b0eb72b31b538bc8e --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_242_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9d7f295a32de24bc5b202642687c5320a35b36c439d07ea3590b73bc472e2ee +size 51395373 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_243_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_243_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8bfdf955f683ef874c46f4dd0519bf3709887f7b --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_243_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75726bd2b64561449486d66b7ea47710b54781d9821c271bc35bccd54a8e6948 +size 51395437 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_244_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_244_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3c4e1c98a7c92ba005bf0b1919670cafb99cb4e4 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_244_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9750949be76f49da4fbf9b7ca884016a8527bad114a0c43c91fd49c2e287e3f3 +size 51395501 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_245_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_245_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3006a5d772d6f8d12a57c44af950c0119394c451 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_245_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb17be09341a350f96521f5405c7d7198ae83e0572758e9b737dc922e910c69b +size 51395437 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_246_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_246_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..accf54d5e3c47a9ba631c9a65bc58bc8cb215853 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_246_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f812a84580a9b0b459d830ac5288601568cf9bb24a8f8c5968c390e42e85609f +size 51395437 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_247_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_247_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e722988d30c66d46a9cca960c08be2e2f8eaed6 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_247_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c85f806cef07d0b16bca430a33222888814b72166ebc9baa91dd897279120f6 +size 51395373 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_248_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_248_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b3659f84a3a8c6183f5f5eba7911c389f6abe28 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_248_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4919284179cf3058b382068fe5c2473585e407818199d89612764757e5c74fd9 +size 51395501 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_249_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_249_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cbc7074b18c57c2dc3b4f45c611d2a6b7cebc1b5 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_249_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1eaed6f6e2d0b5798e63c05b6c51dcbd4f1eb341f420a743e3beb3147709d2f +size 51395565 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..01ca510a5e007c6a31d32b79edf7385359253380 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:797048ec74da10e92a057bdb4a52e799864c0662df98c1b6b3958ce643df0150 +size 51395490 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_250_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_250_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..90bd2abcb7f1ea6179025f4eee810aa38bffe68b --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_250_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a81f16d322ec08f4a5129cc97dd68153a95a58618d52178947dae18a0e3a068 +size 51395501 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_251_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_251_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e9633f1c0929bba82e5d9dc3a8f4983fb597a670 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_251_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5fa68add4ae41d5328a53f29a3cb7b6f445e5ab22e36dc36a9f118874dd19c0b +size 51395373 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_252_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_252_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f354d00c888c2373f8bc96dc30f0b9f3cc02bd8b --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_252_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:082c9e168c10fa854ba09bc5d784740a195f5b4e1a1a7414bd0b494293508b40 +size 51395373 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_253_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_253_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad2f6312851a96c013dc85db4d98d53df4564f94 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_253_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0958a0d25d4c63c67159d4423b9becdb5155d1e361991d95ee901059fb44657f +size 51395373 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_254_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_254_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..931bf953d967388b298e2bf349afc3c2c59415a6 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_254_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c2f83b007f5a849c2be3b979284e7fcc4ce59b1d33cbee2d4440a313562c7bd +size 51395373 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_255_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_255_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0b48cdd7db1a8a61c240a71c0af82b560cab57f1 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_255_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e16580c65754930ee6072242f5e008e7a4aa8e243462182505ab6ceb090fd4a +size 51395373 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8963d8a8d5b4b3ba34c0c677cb1e8ebd753722bd --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1825cfb1ac354c9bbe021eb23bf7bd6bb2785633cc200e0752465e588feac830 +size 51395490 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..84b1da1f8baed9ed0dcf66ba8fee3e9cd70ea21e --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c3ea6223abf7644fcfb74873c9a43ffce34241d0032e82e482ef4acf99148b0 +size 51395362 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f2e5a87b2b34c5b7a30176de7214b17325dd26e1 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ec1d421ec07991272eecf3474aae1a233baf1cf9ec81b0ebf2bbc31a76952aa +size 51395362 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..629f882ef88925d1d4bb540394cf18b05fb08b84 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6284e291342002ae676ff38e058ba7bea4b2111d213ccb77de69f1c7e2000e73 +size 51395426 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8dcacff40e539ccf7331ed392749ff957f35e015 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa515f6eb8a2bea4a4e66f5bc5d11493f95d191dc99c2900460af42610edafa0 +size 51395426 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c4be098d9ac2bd7389759a5bfecdad106d89075 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1278e816c4f2d310afadfbb884eab64246deef20519d94715df082e75b345eb +size 51395351 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..08687415cb661787f1436df646806144aaeedfd7 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbb659255ab4a4b3d5cca5f84933991154e1347b58914ae8336a45444c384719 +size 51395554 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..578d9716ea30ab57386ee41d35bb457ba10b9c14 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd8d9d02e98816642083834bb022f12076103cd3a7ef84f72f9f1a399c52a7a0 +size 51395362 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d68b7e7f8f406a2b10145b0d755ba740884eacaf --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4038e53ac7cba89e9e29dec33bb7115d9cd0beedd4d32a8009391f42e5fcbb6e +size 51395362 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f1275223e671e64706faa4f9763d9b860f1ac8ff --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f150168417bb8d1a07fb2931059bcd3e60be9c56012f7f3b1eeae80dc7d41ec7 +size 51395490 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..87339f4e96d944cf96bf94e51ddceb793a903c51 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d616aaf2739eb8191388f18eac61dadc7ac736160d7f57b7720aa7fb52c18644 +size 51395426 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8d0a45f650a2b79517d88bbbc9b52798f1a1f2b8 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f24321eed036def71421fd32497abda8872cd8e2448637cfbea063ef9afc9e02 +size 51395426 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a77a9186a036ed0f2ead1f6312ba64b60ef9269 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44e3abecf1e715d2d62fbee30fd9b1f46cffa277db9d1beeb808c25efb269d57 +size 51395362 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d102120af490a3222ed32d88a1dc79b1ea8fba9c --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3932d67befa4b940a909aa793aac2916cebf58de895eb74c2598767938e9e315 +size 51395362 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..06105e14d0273cc02235e619287c5483391f83c9 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:514c1ad7e58a13605584846dac171d533be545bdedc20451e6743fdee1d4d1ac +size 51395490 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d74ad4ef5673097bfcad968ca8944add0644bd13 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5e7b9e6deb7a7561d2a9e9e416bacbae652f72b9d4424c314b3de486019d05f +size 51395554 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..49a291418cbff1455945c91627dc5c650bcfb518 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec109ddb9f130aa482fe5f123f491e3fde326dff0bbab3da3a32fb39750fc789 +size 51395415 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c8f3add34c555a6905844cb93cc5905de68bd3bf --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e21f9b05e355556e572c0021e268d64f1471ab3e0461c5287a6f3876c574cb1 +size 51395426 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0e6ee8c2c3539d766120fe28f1e901680d9f6de3 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04255f8cac0f3ef0a6362503f47bd8e6b02cfaf4cdae93da494ba6e2d209a791 +size 51395426 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe29c04a13e7d5cb8ebd5bce47ae2cd58a419c47 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc375a0bfcd5ab38d83781467a12da381031898090ea5c1b945cdea795a6e0ec +size 51395426 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c845daf5ac42b829d8747a9c306d09afd057a88 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c651f93b7b4694e3cb4c25a9b32d0dc3faacc82ad0bac89c3f9d0c79e6301a9 +size 51395426 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..67c9f855f22ec875594a20a3b6b70823f980318b --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ab2ec754d39afd6e02566e7df17f3e678a7eaf69d0d4571338dcf3f754a722d +size 51395490 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cfeaf570d8a05b1afe0ea113009c1af72f22a0c2 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b588f8ba3945d16747129704232dbb72d4e7ecfaf1f8819812d973d96ca727b2 +size 51395490 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e35e39f044da4e3ce9330ac0a001de422056363d --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5286eac6d03cdc37f05c06b2fa6c2b1b8b9959fe77fd1074637840f9b1e2a7b +size 51395426 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..518173087e28f34849d533137fb54226aa7c1957 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:965febc9f7798bdd8c47da5505247f741011cecd6ce6d843279512aae59508fa +size 51395362 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..578cf627f840e2edaa74badf005756f8863b951b --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d8ca25ba8a766133bd99f7723955f517cff35fe1ccdfbd526ae25a6d0a26a03 +size 51395426 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..17db3b0536c59e6cb127c1926d1de332abb8f74b --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64e5226d5ec1b4e374f67cd1d1e4efde32641be0ffff48ed807cf23fb72db6ea +size 51395490 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..22586b36602af630e1a7c281b5cd1e6ab609d5b6 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5215b9e0b9e5307a1ae5d340aa103b058706bdf30399915e3ee6fad030f6c91 +size 51395415 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8110da3a0b6c861d2c9b0481dc6af4249b4f6da1 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1cfbd85600f254b4570f55913be0a2e45af72b1f7f58eb4d3c89b48f8882faa2 +size 51395426 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..54843149ce5ccbca69bd08670514c12de454541e --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40d4ce6716deb04970b5918388951fe786d7f773f3f24a26ed83da3051c08526 +size 51395426 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..285da75383341dce4f1844a20bd3006057e5761c --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0f186b2831a5f1de9e772c4d38cbed6336ccf9c5bf600fbdb9e7d26d4ccce85 +size 51395490 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e954b6a91335f65272decc4b449b4ce8fee72a74 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7bfa5c29fc5d41e41239131a32c1655d95755f3ddffe5067162bb5845471ed66 +size 51395426 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..156c05a2467b78b21610f8c17cd8b1f4e9fe805f --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea6b3519fd58c92ca0ad3821cefa0d0426c8594f8c80b73cb9d1994a5573c5a0 +size 51395426 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bfbbe76bb7bddfe8b3bd9cdc787fe855aff6fe0b --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c60b461cb4853974764d524a6c6f0111061e9aa191c59384659761d77fee8416 +size 51395362 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e6a24bc713a0e6a3f39e8893641d4b460b90f91a --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:733f5683d87a1feb158fd9110f0994c75ebcb80a0e55af4d85b847429dacf766 +size 51395362 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..946f20b76d8308c427b7b984eda379648351c38c --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dfde254fa0c8fc5a1d20d4177c4bcd5077e55d4efb2329d7386815169471ad2c +size 51395426 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e81d480c8dcd8d4b0ed26285541c507550d32205 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f91c916610ff1736b1a61f5b2152672891723cb3503e2c7bfa297d39eeb14ba0 +size 51395490 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ed710a2f1bc0089d017852270388f8c59d2258c --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1b6ae2b52f45543c48b4185d837f796c64a07973e1f2bd59560958e6fbcba42 +size 51395426 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cbeccca86dd4dc9940785c261388e6b7ff972e9e --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72ee2b3b00d4b0394e9867357289c0f882a309768fc865f458dfd46ccc497da5 +size 51395415 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..06e111d5fc6b2c6e46a0659ea77a4c0e20a16303 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:009f995548a288cd6737999e6be68db89d0a5f6175494e92d99764eb1fe321cc +size 51395426 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c255ce1c17be4bdf870a45897bbc04644c6a212 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8a5bd5fefead1d3d2a60a3c9fc7c088da431b8b4c041abc10225e44a3439e95 +size 51395362 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..34bf7760e97655b0020e98b18257178b1f26abaa --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f64f44c8321723f81f69ea03873ca304617e83c463fe0b80da91692192527e48 +size 51395490 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9d96a8db49a2b1f1f8ca6046d561e57fd3d1b8eb --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:600e94645f26e0d0e4b47e1d10dada65e41bde6e11c4b1e16f7291df044d0258 +size 51395490 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec47e004b384b84dc2cafbb3e7c110d805852ab3 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c5908471f571f771f9f258f5772f6012fb949cb65b257856740a86935818da6 +size 51395426 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c7cd6e5c5d4357937870c9c032a4397161fff5f9 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c85d12723f87262d1c6f28adea7c70c4d157efe89ebc96a992549527db755b6 +size 51395362 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab3bef15ae51bfd4facaa42c9ccc96dd7ff71302 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e25984915dc77442bdb542dc20fd3ce7ecbe878cf3a11c56f4d9fd6a20acba0 +size 51395362 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cdebacc0e17af2adbf7f02f52c7e341ad3ea8ffa --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f72d42ade1bcb1f9f1f8976d3b6f6ae4e4c85e085b22fe1749faa9c1800e5be5 +size 51395426 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b2e362c091fdbc91c35a6621e9c13a0b8331ceb --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0575cb8749ec85342a549c763fedf1bc2b4c67e046b448ecbee6bb92fd4ec5a +size 51395490 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..76a65352e77bd84fba9d332a3506608bb9f73963 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35bcbf8c0c4aeb728ad3d3555adc0f3324c27aed42ee68fc2c5873800f5733a9 +size 51395426 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e6ed0dfd9cc1595731043e25794ed5539d2129f6 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5fe4ba50378d12dc68ab2600820f0a085157bc6730685bb7cc86e503bc23f063 +size 51395479 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e7001e5fdef434801712de2cb29dc9375cd019b4 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a625bbaac1d5ab1730a617842d500ea4bfde4289955d560fcb33b095b3af7ff +size 51395490 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..499bf40478c34d74c934f92ad57f3343c18a0728 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3fae9b27d0e9f3e025a3603eb95a685519450ead2c6efac74b0852066a7f2d30 +size 51395362 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5f8ba330e2baec9bc53fbfcbfbff4c4c186ffef2 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:875629e5127c861bb9f39924e10fadf63fffe2dcf66148ebdc53205ae85c5956 +size 51395426 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..815155eaec21122d4523d4a69516c5e448b64295 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfc8aa0990df69d61521da12c71208598846ea9377d4fd59bd71018ec7d19549 +size 51395490 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b038610eb5affabb2cbeda9016263e30c9a23b3 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c82a21a8bacb5d8484f3e86d12bd928969f2ffca683227923b35ed62299d6b2f +size 51395426 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f54625583f849306c7ad3e7a552a8825e64ecf5a --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d66e127f3749ec467f5d55971e3f322697b66ba1c5032ac3514db2b56283494 +size 51395426 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..44c520708be3bf4be15030c4a0328a22a11e7916 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:379033e4cdf1b435574430ad9e8f7fb2b2f8738c31aad6318ef9b55ee171d962 +size 51395426 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..646c57d54da18ef597f9ac76e6c8860ac91a1995 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9edda3e659d934a1f5c4351eb9c07555551fdae81090ece5dea1a69900eb4ddc +size 51395426 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f60cdb6a066ca77fb56ad60d3941b45fc8c50a13 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88cec8697b26f1eaeb45314225a63824da2bc98b9854a7e6d151ad09403e2e61 +size 51395426 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..38c1f6ff7f954259ab1c29e3f595e4f02ba88ffd --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83cc8b8d87cae8a07a996ed78abc7855f50ce73bc0550c6470594dcf9ca25b90 +size 51395554 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..198968c693547f1b345cc1ea9daeb493712943ce --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f251f16b81b56364a740f5426e919a45e73d49687ed3f0037611f961f258abb8 +size 51395351 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1bb1460757e402a5bebde98d8652511ae75d240a --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ce872de1158027d01346c066b996b00da7ea788f7f0c8281086d644b36e5623 +size 51395426 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d77ddedce9517b4cd025f86f026e1646e4c4b3e --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4aa4d42406adf73d9b26b4d44e00b82fc55126d2455a13af5478458ade4b2f4 +size 51395362 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..36b674f9a84a013719673865b0a28d4fc928d8d8 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c34ace21fc93fd7f5a8ef4d550683c7cee9e98866fa466459447344b1fd2cf08 +size 51395490 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5641f0eab063d3b84274756737f72af2d35f7176 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5cf3827f3ff4cc3d1c86d2c20967a9804702dbe95466e8354f63163f49db1a88 +size 51395490 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..43cfd6a1cb6379c39354faf4b8fc95e6aadfeee5 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba65fbe19f5942cf3864e93dbd5cf8307fc1bcea102d4f6dbc8ed66f3ea99d33 +size 51395426 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3470a175cd2089186f13b47a4f8733f24af81806 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61fc5d8066cb4a6f81b6683e5bbf2a35411d059f9ab02535f353b6c82e7747a1 +size 51395362 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a06e949569e98fc3be88166fd444c480e2f1e49 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff8c9813d21f0e9ca15e5d67c7927ae0493da9981c3868e9e524e24a9658e312 +size 51395426 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ace32fc570df90a872cd10800edcc816ee542f1b --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04d336b65781b1e0bee1741401689c9aaaeca3a79ff12036bbe832d7aad72254 +size 51395426 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b2d66348d928d098880d5bf2c9dcb7d5dd36780 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3411fc2a07ba0f48a785ff132bf2e925c85a5e1b2095873c0c9da27cc54ab0a3 +size 51395426 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..30a5e72dc6eb2c6f963324fdca1d51d1c79f5394 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2676ac6e66514766c8baa698a6c14af22c477cc94b12a98cdeaa7cb810bfc90b +size 51395490 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0923dc038f4638ee2215f6f43a9c038af52831d0 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d504b772c821f28d9061ca72af3a621870a7e4ebf064a994821be951c3fcde93 +size 51395351 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1bb22139b79ebaf09980de72c663a3776eba8fbd --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5a05589904b06544d2f81b511153f8eaf348180975ec645d68fb8d54af0b074 +size 51395362 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..08f600f82836cd89f8ef76e6a983d365b78e5749 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4fa6d891f29866f7b83a402492a36a4ae02fdf94f5de50d0d5b0dd0acc99edf5 +size 51395426 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed60b88bd9581a9a344a03e958292dc2be0e4dda --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a286edef85d31116f8cb80468c089cbf1d0b465dc80300bb127549051ef5c424 +size 51395490 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5762368f868bb6e03983b532c352bbc773201bdf --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1db637175b21b03d89c62347de3fb7aa557e43d265439723e8ebd69902bf23c +size 51395426 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8d13bfe2c2dc0153f3217df58966bc64a55152e0 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6bf8ed7a25ec92a2a1f297206d7d23ce468261e8d8c661b708af2c5309f9029 +size 51395426 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..963b7699697c102a8d2340361042c3c824af1aa7 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea80436b63367589ca5f718a36b2383e9d895e6668b8c941b85254054da51821 +size 51395362 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..97b7c2d231730e95f16f0888b362e4a677925287 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f447c11d5481ed1df127a83e9a5abe95b2292da486b968f5e52cb1f382bca3d5 +size 51395426 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9878c9db48f91a71ac1cae274b097a2135410551 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97617eec6fad4ee0bc992538d42a0efd622598b95463220e471c7c6826460b5d +size 51395490 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..231e37786f4c72c2e67e5275065800b296164c93 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8954034b051fe5d81b988362d3cec1d73144f3ead2a43bc9996a8db00521269c +size 51395362 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d97300f44300e1b1ca501a171d40bdf5a6b93ce6 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84551360af14e1cf5cd9e9e9135399f74e8abf1c8095df1b1b5e9eece3e5c710 +size 51395426 diff --git a/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c70c431fcf0c35fba1a95605bd2fdb8f2e31ed09 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e3cf6f7528618d67f5c148455999f9771d2ea1c2ca23f72fcd0c25f23f64bc4 +size 51395479 diff --git a/1b121b21bc4seed5/global_step39672/layer_01-model_00-model_states.pt b/1b121b21bc4seed5/global_step39672/layer_01-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..04236153c18ecab7b8756a4fb3c94a3c2c5441ed --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/layer_01-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ddd0aa48f1f65a62063ba1029af2bd0295f7e0579e2679d1f92964643905f4d +size 187630851 diff --git a/1b121b21bc4seed5/global_step39672/layer_03-model_00-model_states.pt b/1b121b21bc4seed5/global_step39672/layer_03-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..31158fd11dc541e1d4f6f2092efafc97bda15d64 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/layer_03-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1c042da27c916d7a0f8a3f1e5a8066b54c1bf71adee7f96185519f7d908b593 +size 77121283 diff --git a/1b121b21bc4seed5/global_step39672/layer_04-model_00-model_states.pt b/1b121b21bc4seed5/global_step39672/layer_04-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f9de90f1fdd4854388dc18aa5500aa0c4e244d51 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/layer_04-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:265b83907b2b708eaf208f700506a1d2d06ed8fe469aec74ced13956f0d045d8 +size 77121283 diff --git a/1b121b21bc4seed5/global_step39672/layer_05-model_00-model_states.pt b/1b121b21bc4seed5/global_step39672/layer_05-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d78276b092979419cbf8ae741c1e9aa17fbb9e94 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/layer_05-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:feea0c95069b3669dc1d1a7e73f4038474b6ec89f7b90be4a135493acfc03258 +size 77121283 diff --git a/1b121b21bc4seed5/global_step39672/layer_06-model_00-model_states.pt b/1b121b21bc4seed5/global_step39672/layer_06-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e792cb0f4a6ab2a11a235572893a3575f183cc40 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/layer_06-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32ec36aab5dbc0c11d784129d3435efcfcf46e683858956acd51ceec7c1d7b8f +size 77121283 diff --git a/1b121b21bc4seed5/global_step39672/layer_07-model_00-model_states.pt b/1b121b21bc4seed5/global_step39672/layer_07-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca5aacba036ebfc0272bf6688fb5cbff9877064a --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/layer_07-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34a7e6375f0e83a93c29c9e30be802c9bd360dab0b3246eee7919b4070cd0005 +size 77121283 diff --git a/1b121b21bc4seed5/global_step39672/layer_08-model_00-model_states.pt b/1b121b21bc4seed5/global_step39672/layer_08-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..040e7dea0a3b31bc7dac18fad54779cb53913360 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/layer_08-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ff14baaddbad329f5ca96fa484e89b225102a6b9f97b8a26d6e6b4c017eb251 +size 77121283 diff --git a/1b121b21bc4seed5/global_step39672/layer_09-model_00-model_states.pt b/1b121b21bc4seed5/global_step39672/layer_09-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7425be72d916835da45e89f3df923042623760ff --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/layer_09-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e486e9b62c175e58a906b82f2908ea1bf6f2f71894bd94648f702a0ed77549ae +size 77121283 diff --git a/1b121b21bc4seed5/global_step39672/layer_10-model_00-model_states.pt b/1b121b21bc4seed5/global_step39672/layer_10-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..01914287559ad4945af4c2a573c127968332cb4a --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/layer_10-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:205eba4b96e0ca4367c8701ee1b3df93f8401be81bb0abeeff8455517d95cc46 +size 77121283 diff --git a/1b121b21bc4seed5/global_step39672/layer_11-model_00-model_states.pt b/1b121b21bc4seed5/global_step39672/layer_11-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..75c1ce3b6f7dc09c8f0687328464bbcacf919796 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/layer_11-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4c03eaa6176306aca338977d5747a40569ffcfd18e92bf1a8bb4267faf536f7 +size 77121283 diff --git a/1b121b21bc4seed5/global_step39672/layer_12-model_00-model_states.pt b/1b121b21bc4seed5/global_step39672/layer_12-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9af1f99b3cfc2c1b1862e2c351109961c413bc54 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/layer_12-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9462874bfd24508b94b72affbcb674fe8d44290d006d9a837f87f4a38b87c916 +size 77121283 diff --git a/1b121b21bc4seed5/global_step39672/layer_13-model_00-model_states.pt b/1b121b21bc4seed5/global_step39672/layer_13-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..90b6d21180a2e0b74efc27b67b8868c702a8266d --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/layer_13-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66f0e186774591e794341526d3efbbb3c63c40a2c7d75b31940286bd8d31dc0c +size 77121283 diff --git a/1b121b21bc4seed5/global_step39672/layer_14-model_00-model_states.pt b/1b121b21bc4seed5/global_step39672/layer_14-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d094d7b21b241361b4467d9796feb198fb99488 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/layer_14-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6dbd8cdf052eb95a81c97ecbe5315fe771a90cc0554b4de1115de4a3dc54c601 +size 77121283 diff --git a/1b121b21bc4seed5/global_step39672/layer_15-model_00-model_states.pt b/1b121b21bc4seed5/global_step39672/layer_15-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a216e82edc2b001896043c1488f848819cf7efd --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/layer_15-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e4b0a4229dd7c2f91ec66cd403216735209e75e4bc52dee16668c056e054b22 +size 77121283 diff --git a/1b121b21bc4seed5/global_step39672/layer_16-model_00-model_states.pt b/1b121b21bc4seed5/global_step39672/layer_16-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0423a078f2b9525ba022ae124d0824ca90e9792 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/layer_16-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe11cd70a361cef312c7c21eed8354bd0cf4b20122394f95e8c0c05646c286e9 +size 77121283 diff --git a/1b121b21bc4seed5/global_step39672/layer_17-model_00-model_states.pt b/1b121b21bc4seed5/global_step39672/layer_17-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6145e3b14d760f257f4adc02fc3957ed526c87e6 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/layer_17-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f1315e9f03446f6b46dd12d03c2ab7759c79973f99e0d48629ccef900c0734c +size 77121283 diff --git a/1b121b21bc4seed5/global_step39672/layer_18-model_00-model_states.pt b/1b121b21bc4seed5/global_step39672/layer_18-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..774503542c061a1bec3badef9a57bc5975d4de98 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/layer_18-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed133cd55766bad6a292799b6b2ced95c436114bb2b550bb966aefc0cfe3d83a +size 77121283 diff --git a/1b121b21bc4seed5/global_step39672/layer_19-model_00-model_states.pt b/1b121b21bc4seed5/global_step39672/layer_19-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc24cecba6c21a706cc23a011060ca9586efa0cf --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/layer_19-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d019073011165e2603cf6ff4aa9c06063309cb86dc16e852b9eed007e946850 +size 77121283 diff --git a/1b121b21bc4seed5/global_step39672/layer_20-model_00-model_states.pt b/1b121b21bc4seed5/global_step39672/layer_20-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f390285e1403fb3450ffa77c3bad4a257ba28da6 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/layer_20-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0a1414dfba70d9886e669e09f8eb4275602840176c646893106af1143252af3 +size 77121283 diff --git a/1b121b21bc4seed5/global_step39672/layer_21-model_00-model_states.pt b/1b121b21bc4seed5/global_step39672/layer_21-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe640bffc2eb01108e5878670efed4f0e02c4e17 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/layer_21-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfa58f5c3317dd50b8df105745b2e0aa0fbd657bad162df016d17dc791bed6ff +size 77121283 diff --git a/1b121b21bc4seed5/global_step39672/layer_22-model_00-model_states.pt b/1b121b21bc4seed5/global_step39672/layer_22-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..641bf0ad378ecf0a7bd4fad1f000c85bdf00b843 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/layer_22-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa9030a6813b7cfad3cf71092562e93c5bdfc09771d90970c754e1fc8dcdd2c8 +size 77121283 diff --git a/1b121b21bc4seed5/global_step39672/layer_23-model_00-model_states.pt b/1b121b21bc4seed5/global_step39672/layer_23-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a6c19343c405b91c79a63f765258ad62dc49a70 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/layer_23-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:904c934b051494b6901670ffa1870b85e1edaa4dd44c56e316496377b8ee53a0 +size 77121283 diff --git a/1b121b21bc4seed5/global_step39672/layer_24-model_00-model_states.pt b/1b121b21bc4seed5/global_step39672/layer_24-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..deae920629fb2a3f384b7f2aa9ee323863c816a7 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/layer_24-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc6a663ab85554e92bbe65645272652b75d9c317d14af9a7ac39a1ae086752c3 +size 77121283 diff --git a/1b121b21bc4seed5/global_step39672/layer_25-model_00-model_states.pt b/1b121b21bc4seed5/global_step39672/layer_25-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..af615db3dcd5fbe92cb5c5d1d3d66743f048529f --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/layer_25-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34ee15e99b0b11668d0f0b0b0dfdc7a7238f41c110fb733b66823acf45d16837 +size 77121283 diff --git a/1b121b21bc4seed5/global_step39672/layer_26-model_00-model_states.pt b/1b121b21bc4seed5/global_step39672/layer_26-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6dcb7a252637218e80ba1ba5aefd556c5e43c715 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/layer_26-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:038963c5227005be6d795b82f97b1bc40d44ac4db31a619b8d0e162a104e8d3f +size 77121283 diff --git a/1b121b21bc4seed5/global_step39672/layer_27-model_00-model_states.pt b/1b121b21bc4seed5/global_step39672/layer_27-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c359432d37a1980ebdbd7ad9187f58a26bf11b6 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/layer_27-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a8a644f8b8e7e4f8811ba3f0465300f0b0f0e87c3dee8ac5e3afbf6ad56a303 +size 77121283 diff --git a/1b121b21bc4seed5/global_step39672/layer_28-model_00-model_states.pt b/1b121b21bc4seed5/global_step39672/layer_28-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e48e2839a3e700a881dee8d4dc21de658ac22c4b --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/layer_28-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bbdf9f9f9b7e4d50d64c67ed7d22e3c49c46094e87898904bf88d0906e0e6a0c +size 77121283 diff --git a/1b121b21bc4seed5/global_step39672/layer_30-model_00-model_states.pt b/1b121b21bc4seed5/global_step39672/layer_30-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..456b2269ec08c7159771a9ed98aba919107053a9 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/layer_30-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27e27d0d47fb3a7f66f39c6dfe204b48e17e4ef2b4ace932cc3518b386f0bf8e +size 8387 diff --git a/1b121b21bc4seed5/global_step39672/mp_rank_00_model_states.pt b/1b121b21bc4seed5/global_step39672/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eba080acdad5b13eb252985cc6553652c1de60d2 --- /dev/null +++ b/1b121b21bc4seed5/global_step39672/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24536acb753575316249d85f800f10997aa37a9c2538405e459af5f1254308c8 +size 43827 diff --git a/1b121b21bc4seed5/transformers/config.json b/1b121b21bc4seed5/transformers/config.json new file mode 100644 index 0000000000000000000000000000000000000000..7120acb75187622c061f0425674b658dd9155502 --- /dev/null +++ b/1b121b21bc4seed5/transformers/config.json @@ -0,0 +1 @@ +{"vocab_size": 50304, "n_positions": 2048, "n_embd": 1792, "n_layer": 26, "n_head": 14, "n_inner": 7168, "activation_function": "gelu", "resid_pdrop": 0.1, "embd_pdrop": 0.1, "attn_pdrop": 0.1, "layer_norm_epsilon": 1e-05, "initializer_range": 0.02, "summary_type": "cls_index", "summary_use_proj": true, "summary_activation": null, "summary_first_dropout": 0.1, "summary_proj_to_labels": true, "scale_attn_weights": true, "use_cache": true, "scale_attn_by_inverse_layer_idx": false, "reorder_and_upcast_attn": false, "bos_token_id": 50256, "eos_token_id": 50256, "return_dict": true, "output_hidden_states": false, "output_attentions": false, "torchscript": false, "torch_dtype": null, "use_bfloat16": false, "tf_legacy_loss": false, "pruned_heads": {}, "tie_word_embeddings": true, "is_encoder_decoder": false, "is_decoder": false, "cross_attention_hidden_size": null, "add_cross_attention": false, "tie_encoder_decoder": false, "max_length": 20, "min_length": 0, "do_sample": false, "early_stopping": false, "num_beams": 1, "num_beam_groups": 1, "diversity_penalty": 0.0, "temperature": 1.0, "top_k": 50, "top_p": 1.0, "typical_p": 1.0, "repetition_penalty": 1.0, "length_penalty": 1.0, "no_repeat_ngram_size": 0, "encoder_no_repeat_ngram_size": 0, "bad_words_ids": null, "num_return_sequences": 1, "chunk_size_feed_forward": 0, "output_scores": false, "return_dict_in_generate": false, "forced_bos_token_id": null, "forced_eos_token_id": null, "remove_invalid_values": false, "exponential_decay_length_penalty": null, "suppress_tokens": null, "begin_suppress_tokens": null, "architectures": ["GPT2LMHeadModel"], "finetuning_task": null, "id2label": {"0": "LABEL_0", "1": "LABEL_1"}, "label2id": {"LABEL_0": 0, "LABEL_1": 1}, "tokenizer_class": null, "prefix": null, "pad_token_id": null, "sep_token_id": null, "decoder_start_token_id": null, "task_specific_params": null, "problem_type": null, "_name_or_path": "", "transformers_version": "4.25.0.dev0", "n_ctx": 1024, "gradient_checkpointing": false, "model_type": "gpt2"} \ No newline at end of file diff --git a/1b121b21bc4seed5/transformers/pytorch_model.bin b/1b121b21bc4seed5/transformers/pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..307c50978851eb1814e378e4cce20b0fd1a60bcf --- /dev/null +++ b/1b121b21bc4seed5/transformers/pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cdcba18c02068b3c7fc0e6568652943b2bd1705dae1cc2a6cdfa0be11b863276 +size 2410895501 diff --git a/tensorboard/tensorboard_1b121b21bc4seed1/events.out.tfevents.1674660087.nid006651.126730.0 b/tensorboard/tensorboard_1b121b21bc4seed1/events.out.tfevents.1674660087.nid006651.126730.0 new file mode 100644 index 0000000000000000000000000000000000000000..0d35e070ec240e16391f75d7808bc9034c3ba032 --- /dev/null +++ b/tensorboard/tensorboard_1b121b21bc4seed1/events.out.tfevents.1674660087.nid006651.126730.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0a00fe1ea610c514a1baafeae6172f2d115664659fe6f7cacc9307ac3433f3b +size 71272426 diff --git a/tensorboard/tensorboard_1b121b21bc4seed2/events.out.tfevents.1674660087.nid006899.126955.0 b/tensorboard/tensorboard_1b121b21bc4seed2/events.out.tfevents.1674660087.nid006899.126955.0 new file mode 100644 index 0000000000000000000000000000000000000000..93b324622066811ffbe61b61edb0236fbafa95e3 --- /dev/null +++ b/tensorboard/tensorboard_1b121b21bc4seed2/events.out.tfevents.1674660087.nid006899.126955.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4615f6fb4e3281eaf68908da482ae415a8dbbd6a7094d3b76bd17646c1f1f613 +size 71272426 diff --git a/tensorboard/tensorboard_1b121b21bc4seed4/events.out.tfevents.1674660087.nid007141.44159.0 b/tensorboard/tensorboard_1b121b21bc4seed4/events.out.tfevents.1674660087.nid007141.44159.0 new file mode 100644 index 0000000000000000000000000000000000000000..313491bfb966e20aacc3907df93715c87db23785 --- /dev/null +++ b/tensorboard/tensorboard_1b121b21bc4seed4/events.out.tfevents.1674660087.nid007141.44159.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e59ed4a98ae33d56dc8675f55ed61b6fa543c2bfa8cc0aabcc98583d09b7f5b6 +size 71272426 diff --git a/tensorboard/tensorboard_1b121b21bc4seed5/events.out.tfevents.1674660087.nid007121.77603.0 b/tensorboard/tensorboard_1b121b21bc4seed5/events.out.tfevents.1674660087.nid007121.77603.0 new file mode 100644 index 0000000000000000000000000000000000000000..373992fcec9f27caa554a284206a726e0a075a6a --- /dev/null +++ b/tensorboard/tensorboard_1b121b21bc4seed5/events.out.tfevents.1674660087.nid007121.77603.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84145c2714ed6d568e5cc9f6555e26185810e4def6d7cd5fa35aa4e29cb2a4fe +size 71272426