diff --git a/.gitattributes b/.gitattributes index 1cc57ef8f90d95ad13febc5f269c72797f77c622..118bab74a516326954c6b9e5914cf080b66369d0 100644 --- a/.gitattributes +++ b/.gitattributes @@ -128,3 +128,28 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text 8b7178b35b/evaluation/generation/examples.8b7178b35b_GEM-wiki_lingua_en_tldr_en_0.jsonl filter=lfs diff=lfs merge=lfs -text 8b7178b35b/evaluation/generation/examples.8b7178b35b_gem_xsum_article_DOC_summary_2.jsonl filter=lfs diff=lfs merge=lfs -text 8b7178b35b/evaluation/generation/examples.global_step84877_gem_xsum_article_DOC_summary_1.jsonl filter=lfs diff=lfs merge=lfs -text +*/evaluation/examples*.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b25b/evaluation/generation/examples.8b7178b25b_gem_xsum_article_DOC_summary_0.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b25b/evaluation/generation/examples.8b7178b25b_GEM-web_nlg_en_PALM_prompt_1.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b25b/evaluation/generation/examples.8b7178b25b_GEM-web_nlg_en_PALM_prompt_2.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b25b/evaluation/generation/examples.8b7178b25b_GEM-web_nlg_en_PALM_prompt_3.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b25b/evaluation/generation/examples.8b7178b25b_GEM-wiki_lingua_en_tldr_en_3.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b25b/evaluation/generation/examples.8b7178b25b_GEM-wiki_lingua_en_tldr_en_5.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b25b/evaluation/generation/examples.8b7178b25b_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b25b/evaluation/generation/examples.8b7178b25b_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b25b/evaluation/generation/examples.8b7178b25b_gem_xsum_article_DOC_summary_5.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b25b/evaluation/generation/examples.8b7178b25b_GEM-web_nlg_en_PALM_prompt_0.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b25b/evaluation/generation/examples.8b7178b25b_GEM-web_nlg_en_PALM_prompt_5.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b25b/evaluation/generation/examples.8b7178b25b_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b25b/evaluation/generation/examples.8b7178b25b_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b25b/evaluation/generation/examples.8b7178b25b_GEM-wiki_lingua_en_tldr_en_2.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b25b/evaluation/generation/examples.8b7178b25b_GEM-wiki_lingua_en_tldr_en_4.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b25b/evaluation/generation/examples.8b7178b25b_gem_xsum_article_DOC_summary_3.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b25b/evaluation/generation/examples.8b7178b25b_gem_xsum_article_DOC_summary_4.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b25b/evaluation/generation/examples.8b7178b25b_GEM-web_nlg_en_PALM_prompt_4.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b25b/evaluation/generation/examples.8b7178b25b_GEM-wiki_lingua_en_tldr_en_0.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b25b/evaluation/generation/examples.8b7178b25b_GEM-wiki_lingua_en_tldr_en_1.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b25b/evaluation/generation/examples.8b7178b25b_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b25b/evaluation/generation/examples.8b7178b25b_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b25b/evaluation/generation/examples.8b7178b25b_gem_xsum_article_DOC_summary_1.jsonl filter=lfs diff=lfs merge=lfs -text +8b7178b25b/evaluation/generation/examples.8b7178b25b_gem_xsum_article_DOC_summary_2.jsonl filter=lfs diff=lfs merge=lfs -text diff --git a/8b7178b25b/evaluation/generation/agg.8b7178b25b_GEM-web_nlg_en_PALM_prompt_0.json b/8b7178b25b/evaluation/generation/agg.8b7178b25b_GEM-web_nlg_en_PALM_prompt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..922f290b55832e94a5bf10d0e114ee19a85712de --- /dev/null +++ b/8b7178b25b/evaluation/generation/agg.8b7178b25b_GEM-web_nlg_en_PALM_prompt_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.33618386090404295, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.043286547374004225}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07608115633976532, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0028424335866037475}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.243734587530279, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005032751672173048}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.09550360928926843, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0021611192824620468}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03391274645846755, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0017782441786429572}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.11477361563470867, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0030177112931945443}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.04353421604632926, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0013022741040944032}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.07249954185930807, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002716866763111571}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.23447583587320983, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004820896551192642}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.0908905716888711, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0019748576875776485}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.07260565563718514, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0027622865524293628}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.2312007323793673, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004666750865618609}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.09063319866429098, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002018782468480028}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b25b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b25b/evaluation/generation/agg.8b7178b25b_GEM-web_nlg_en_PALM_prompt_1.json b/8b7178b25b/evaluation/generation/agg.8b7178b25b_GEM-web_nlg_en_PALM_prompt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..5ddcc294b9675174bffc86ef19718c0d25a78aa3 --- /dev/null +++ b/8b7178b25b/evaluation/generation/agg.8b7178b25b_GEM-web_nlg_en_PALM_prompt_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.5152510207869508, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.039697768768641464}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.1335251141437586, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.004421796872864802}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.3040669240102272, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0049926465687368735}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.15419793855600986, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0037752055082234935}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.06857339375782437, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0030273264083127568}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.1555986112064758, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0036341014671041087}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.07820906828691397, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0026222161094111586}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.1195649771956543, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0038518942294089972}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.2838951533263151, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004599064364517073}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.13965714245032726, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0032487392690607572}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.12140487798820795, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003915984273012587}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.2857833042522088, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004601461544101827}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.14150307262693815, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0033007395324502467}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b25b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b25b/evaluation/generation/agg.8b7178b25b_GEM-web_nlg_en_PALM_prompt_2.json b/8b7178b25b/evaluation/generation/agg.8b7178b25b_GEM-web_nlg_en_PALM_prompt_2.json new file mode 100644 index 0000000000000000000000000000000000000000..ea1f0b5984f60c4e2c842f53e36307deda1647a3 --- /dev/null +++ b/8b7178b25b/evaluation/generation/agg.8b7178b25b_GEM-web_nlg_en_PALM_prompt_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.6450721424031474, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.035938592978876936}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.17715496451419446, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.005377686826508908}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.3442204927205235, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.00499209962075588}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.19228537050298922, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.004356183491682661}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.09659406582034752, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0036720254666308344}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.1816245156374427, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0038421174433974025}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.1017490401630499, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.003080557280075834}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.15519367504713033, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.004580706449804959}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.31893881029765586, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004597766706728441}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.17158392384169643, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0037128302671958994}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.1592800915810083, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0047149524911017215}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.3221825821541532, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0046252310161258746}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.17498254398589475, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0037985612156152086}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b25b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b25b/evaluation/generation/agg.8b7178b25b_GEM-web_nlg_en_PALM_prompt_3.json b/8b7178b25b/evaluation/generation/agg.8b7178b25b_GEM-web_nlg_en_PALM_prompt_3.json new file mode 100644 index 0000000000000000000000000000000000000000..fa4cadc5fdbf949f6f6258235e84525a7ea55237 --- /dev/null +++ b/8b7178b25b/evaluation/generation/agg.8b7178b25b_GEM-web_nlg_en_PALM_prompt_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.8785043636862591, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.02652000083973547}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.2002191357399255, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.005700191155087746}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.3622650735119951, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005105318033672305}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.21217682060449367, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.004581243352642801}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.10955905558045385, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0038849982073218873}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.19262377036723086, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003902442560309681}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.11312048852329888, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.003186877123824252}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.1744946205047383, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.004899868234689971}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.33190561350734876, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004628476785750535}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.1874319081280966, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0038899168243038715}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.17972186968155374, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.005058207025529124}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.33723235220496645, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0046889691038068775}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.19207381785134825, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.004003703743860644}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b25b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b25b/evaluation/generation/agg.8b7178b25b_GEM-web_nlg_en_PALM_prompt_4.json b/8b7178b25b/evaluation/generation/agg.8b7178b25b_GEM-web_nlg_en_PALM_prompt_4.json new file mode 100644 index 0000000000000000000000000000000000000000..17d0a4e3c3902c6b7cf6439fa7f1cbd3474e8d82 --- /dev/null +++ b/8b7178b25b/evaluation/generation/agg.8b7178b25b_GEM-web_nlg_en_PALM_prompt_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 1.020225734756704, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.06946466420275214}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.21447559212644274, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.005787602630220149}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.3797811786576114, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005078572769442694}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.22615455778377724, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.004584303113870005}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.11802182161980528, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.003954053081043237}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.20495230642568182, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003956396099130858}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.12153309984630654, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0032009564132827184}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.18574729294363898, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.00493965653212434}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.34661430398431914, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004643977843173891}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.1985084531863174, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.003863020108912202}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.19295820334137398, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.005149923293184489}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.3532599821115898, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004685486372918684}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.20493355705865743, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.004011218572127487}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b25b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b25b/evaluation/generation/agg.8b7178b25b_GEM-web_nlg_en_PALM_prompt_5.json b/8b7178b25b/evaluation/generation/agg.8b7178b25b_GEM-web_nlg_en_PALM_prompt_5.json new file mode 100644 index 0000000000000000000000000000000000000000..53933c5793a8aa30c8b87a1301c811aee8ce78ad --- /dev/null +++ b/8b7178b25b/evaluation/generation/agg.8b7178b25b_GEM-web_nlg_en_PALM_prompt_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 1.1738991703843653, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.05137420728965795}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.23842752486609714, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.00616558462817229}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.39104608539227964, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005079097315439687}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.2452749113827306, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.004866057995099286}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.13743673376990653, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.004448566773563913}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.21617363071605727, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.004065117072186819}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.13673599319945717, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.003545382189555846}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.20669362004199143, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0053303444381744315}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.35345362943589836, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004581784867877382}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.2145149869812429, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.004135695136449003}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.21482050441032427, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.005549487778372521}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.3612051449037077, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004657096205531439}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.22169261840373009, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.004292938565416988}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b25b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b25b/evaluation/generation/agg.8b7178b25b_GEM-wiki_lingua_en_tldr_en_0.json b/8b7178b25b/evaluation/generation/agg.8b7178b25b_GEM-wiki_lingua_en_tldr_en_0.json new file mode 100644 index 0000000000000000000000000000000000000000..98449f52256b6c38bea78102d15a7c9eefebac58 --- /dev/null +++ b/8b7178b25b/evaluation/generation/agg.8b7178b25b_GEM-wiki_lingua_en_tldr_en_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.16222110345712215, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002918181626000938}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.23556142979563985, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0035092798940514463}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.17281704832161807, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0025639705499622615}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.04035916262517482, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0011089852877097363}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.06187933259063034, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0015927286355937283}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.04445750772336212, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0010694173040695087}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.12115800294799915, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0023302786580353405}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.1793437869920672, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0027904364481447434}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.12828595447707558, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0018630698897748783}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.15193645088089489, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.002794596188541928}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.22017606445792967, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.003307741344782461}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.16125234602130137, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0024054029356366125}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 3.2204812581094187, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.0968937530189579}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b25b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b25b/evaluation/generation/agg.8b7178b25b_GEM-wiki_lingua_en_tldr_en_1.json b/8b7178b25b/evaluation/generation/agg.8b7178b25b_GEM-wiki_lingua_en_tldr_en_1.json new file mode 100644 index 0000000000000000000000000000000000000000..0d4656cc502f82d5e6ce710b38f6dd75bdf33adc --- /dev/null +++ b/8b7178b25b/evaluation/generation/agg.8b7178b25b_GEM-wiki_lingua_en_tldr_en_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.24835405674131716, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.003595946507957674}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.22065222520601965, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0030326234032250735}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.20057722026752264, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.00237727127672953}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.07072572329707479, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.002023483136430399}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.05888749376061464, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0015271270172799948}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.053780768787129375, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0012652221510456923}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.18962847615836217, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0029056148560385174}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.16669593752772216, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0023452388157941375}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.15099195793433165, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0017939149386485946}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.23119707647225618, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0034029730598757074}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.20514467867088854, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0028358663517956315}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.18619742012806825, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0022080861119325576}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 3.030764799858383, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.10180137949258324}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b25b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b25b/evaluation/generation/agg.8b7178b25b_e2e_nlg_cleaned_generate_text_restaurant_0.json b/8b7178b25b/evaluation/generation/agg.8b7178b25b_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..8220ac26714b3c58f189eb667bb17b40deba2d45 --- /dev/null +++ b/8b7178b25b/evaluation/generation/agg.8b7178b25b_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 1.8080075016885704, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.061027545228237855}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.1356910382997071, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0015410643240858764}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.2778453886224831, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0023539268248121705}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.17861979049522314, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0018002125016461491}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.03490809623131593, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0008357898041576343}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.07284634942140401, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0015701168954429102}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.046215425350075, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0010566397123776003}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.12227403244327856, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0011855454993101654}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.2551033251187225, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0019031145709281366}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.16201597249905292, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0013971090679042123}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.113242028542405, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0013998996791185847}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.23203443734017606, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0022390418934348437}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.14908466648922475, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016626826909044133}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b25b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b25b/evaluation/generation/agg.8b7178b25b_e2e_nlg_cleaned_generate_text_restaurant_1.json b/8b7178b25b/evaluation/generation/agg.8b7178b25b_e2e_nlg_cleaned_generate_text_restaurant_1.json new file mode 100644 index 0000000000000000000000000000000000000000..c13e863b28208889dde3b957de50697e79ac8eee --- /dev/null +++ b/8b7178b25b/evaluation/generation/agg.8b7178b25b_e2e_nlg_cleaned_generate_text_restaurant_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 12.173849341913149, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.0669092468478733}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.5970385739901486, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.003272991717133695}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.44205108840831364, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002990943407358534}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.48129644782721304, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0023219173855042303}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.2911262146867607, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.002892523328423528}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.2107609477318019, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0022166981158979714}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.23032000484043905, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0021147211593944798}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.4377488624210833, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.003110832463080634}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3198170788492075, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002444190246186975}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.34966965256911114, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.002108342891501849}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.48957738460024036, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.00327157474691632}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.36068779636155734, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0027524175233159713}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.39331173897680705, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0023364505709058668}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b25b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b25b/evaluation/generation/agg.8b7178b25b_e2e_nlg_cleaned_generate_text_restaurant_2.json b/8b7178b25b/evaluation/generation/agg.8b7178b25b_e2e_nlg_cleaned_generate_text_restaurant_2.json new file mode 100644 index 0000000000000000000000000000000000000000..e04e01a91fba855162754b3be6b6b84bdddc7099 --- /dev/null +++ b/8b7178b25b/evaluation/generation/agg.8b7178b25b_e2e_nlg_cleaned_generate_text_restaurant_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 14.360624153571306, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.15724700369597677}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.6032331597687249, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.003142877448057622}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4697575589134947, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0029526957130554953}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.5041317140273615, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0022753134233410278}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.30851618494266825, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.002855313490834544}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.23616858770973606, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002325964607821345}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.25374280478792693, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.002169411661246531}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.4477614821909179, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.003011118677636196}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3459816794847227, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002532543665969986}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.3721296496966484, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.002164018647000424}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.5054563233222107, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0032185989379280733}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.39233324008569126, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0027964602331100393}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.42160904040581204, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002384317338752149}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b25b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b25b/evaluation/generation/agg.8b7178b25b_e2e_nlg_cleaned_generate_text_restaurant_3.json b/8b7178b25b/evaluation/generation/agg.8b7178b25b_e2e_nlg_cleaned_generate_text_restaurant_3.json new file mode 100644 index 0000000000000000000000000000000000000000..a9c4c5886e186222466b8bc913fc37bd826a6668 --- /dev/null +++ b/8b7178b25b/evaluation/generation/agg.8b7178b25b_e2e_nlg_cleaned_generate_text_restaurant_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 15.173778916293744, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.24020125390484678}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.6038782195503243, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.003130218028564903}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4797961783746489, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0029264432136497623}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.5122282123885756, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0022794016747342454}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.31128306325561933, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0028044649859898306}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.2447494516430458, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002368198668181156}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.2611392423531194, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0021928684064362373}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.44868202075612884, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0029681578589764264}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.35482043982343436, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002532913929369527}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.37928627551530325, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0021871071072142663}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.5087702457406414, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0031818356512290486}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.4036850753818513, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0028061971662930287}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.43123333798993546, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002401597688343299}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b25b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b25b/evaluation/generation/agg.8b7178b25b_e2e_nlg_cleaned_generate_text_restaurant_4.json b/8b7178b25b/evaluation/generation/agg.8b7178b25b_e2e_nlg_cleaned_generate_text_restaurant_4.json new file mode 100644 index 0000000000000000000000000000000000000000..3f0f4f3578743d868e19dc8e78e33943e9cb69df --- /dev/null +++ b/8b7178b25b/evaluation/generation/agg.8b7178b25b_e2e_nlg_cleaned_generate_text_restaurant_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 15.78836334652692, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.16277087917874616}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.6052306848983445, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0031205758451821283}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.49015291142822803, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002870806275113502}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.5201963806927633, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0022664890545995124}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.31194428367362853, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0027609843407215874}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.2500276639929066, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0023425058959290804}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.2653610425045864, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0021838284720614534}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.4475978408946653, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002901824428209634}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.36147111146407906, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002523200720958866}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.3838642484464721, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.002185515405072229}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.5110579537103325, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0031404148777386892}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.4135967411759738, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0027946622087117543}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.43919378367441203, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002408659068024605}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b25b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b25b/evaluation/generation/agg.8b7178b25b_e2e_nlg_cleaned_generate_text_restaurant_5.json b/8b7178b25b/evaluation/generation/agg.8b7178b25b_e2e_nlg_cleaned_generate_text_restaurant_5.json new file mode 100644 index 0000000000000000000000000000000000000000..3e787f628b34f5fb799e79dc50faa25cdbebc22e --- /dev/null +++ b/8b7178b25b/evaluation/generation/agg.8b7178b25b_e2e_nlg_cleaned_generate_text_restaurant_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 15.879323420491742, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.1522927233333457}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.6064323245894362, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.00315510278665659}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.49013366730559393, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0028136604439425025}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.5216373530710218, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002262224044659468}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.3150817079641561, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.002829192112850875}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.25132514912770915, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002318826430015561}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.26786622625063644, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.002208434520877025}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.45023806138186195, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002949168521598567}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.36355539000425124, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002526510160020316}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.38681699896646954, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.002220989687079745}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.5137337228447252, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0031936836223124105}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.41496788459604567, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0027605438893900454}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.4417889417099761, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0024158193931717187}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b25b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b25b/evaluation/generation/agg.8b7178b25b_gem_xsum_article_DOC_summary_0.json b/8b7178b25b/evaluation/generation/agg.8b7178b25b_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..a5e86e18b91a6e3e7bc8ab46fd6d8c4e4c31064c --- /dev/null +++ b/8b7178b25b/evaluation/generation/agg.8b7178b25b_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.1512189693389312, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002590198483449934}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.32951007687075756, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004923756202298708}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.20062931818668506, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002892087092668822}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.03240083882273609, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0011887319293568278}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.07461053739480651, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0027791525130900266}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.044133865209903714, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0015693045278532822}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.11056422701824653, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0021853162208514175}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.23921769394978765, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.003783594428094317}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.14533977808404885, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0021630231020242576}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.12055829236568064, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.002297890666943901}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.2623026232832005, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004182995633448934}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.15912733837926105, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0023937408312475765}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.9472662234201847, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.0954010664780363}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b25b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b25b/evaluation/generation/agg.8b7178b25b_gem_xsum_article_DOC_summary_1.json b/8b7178b25b/evaluation/generation/agg.8b7178b25b_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..037da320a295571edb694a6ffb02bc03bb271749 --- /dev/null +++ b/8b7178b25b/evaluation/generation/agg.8b7178b25b_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.2431489069099882, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.004319149380207122}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.27274551008869324, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004181125297952178}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.24058051563117627, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.003619950901783304}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.06156338993755893, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0027090151794028584}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.06564279411701872, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0026141410795920464}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.05891708042714147, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.002369248568269019}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.18703509762652787, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0036036431129194833}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.20956010556672522, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.00345405751329193}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.1845786738464429, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0030093215424524295}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.18954846036997042, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0035941447605698394}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.21418956311713871, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0035468160066617596}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.18768186260751757, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.003017598467168456}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 2.857997728240847, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.15132505328438867}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b25b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b25b/evaluation/generation/agg.8b7178b25b_gem_xsum_article_DOC_summary_2.json b/8b7178b25b/evaluation/generation/agg.8b7178b25b_gem_xsum_article_DOC_summary_2.json new file mode 100644 index 0000000000000000000000000000000000000000..d06ee3e710a9f9d3cea831c598bcdbd72fbf8a9d --- /dev/null +++ b/8b7178b25b/evaluation/generation/agg.8b7178b25b_gem_xsum_article_DOC_summary_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.25234682823435783, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.004406932928762655}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.26739840698638306, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0039999072862688684}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.24657160673903905, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0037739176215048444}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.06567480327233229, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0027842377535723913}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.06599412859644187, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0026775951767211374}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.06271701269177109, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0025663699767628305}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.1921361411782326, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0036263536814562453}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.20386135964058816, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0033147209011893724}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.1876781101224112, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0031437463539169125}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.19374913452852363, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0036251531161871544}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.20676693183261305, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0034014354284824795}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.1896272533115015, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0031550558124475133}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 3.19195992073562, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.2067955639958893}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b25b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/8b7178b25b/evaluation/generation/examples.8b7178b25b_GEM-web_nlg_en_PALM_prompt_0.jsonl b/8b7178b25b/evaluation/generation/examples.8b7178b25b_GEM-web_nlg_en_PALM_prompt_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..27d7145d147c659fead445525caa29e3bde120a4 --- /dev/null +++ b/8b7178b25b/evaluation/generation/examples.8b7178b25b_GEM-web_nlg_en_PALM_prompt_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc141882d70577d64a629af820e65de857d7cebc8a97999f9b0a04b6756b2c15 +size 3823764 diff --git a/8b7178b25b/evaluation/generation/examples.8b7178b25b_GEM-web_nlg_en_PALM_prompt_1.jsonl b/8b7178b25b/evaluation/generation/examples.8b7178b25b_GEM-web_nlg_en_PALM_prompt_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..ef8b437cce991986aeb7311bbbb011fbffb78e9f --- /dev/null +++ b/8b7178b25b/evaluation/generation/examples.8b7178b25b_GEM-web_nlg_en_PALM_prompt_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8bd8fb2ee288e99c763f301203e68fc5701dd70af25cdf486443fddeb1dc0bdf +size 4753296 diff --git a/8b7178b25b/evaluation/generation/examples.8b7178b25b_GEM-web_nlg_en_PALM_prompt_2.jsonl b/8b7178b25b/evaluation/generation/examples.8b7178b25b_GEM-web_nlg_en_PALM_prompt_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..da1c8f547bd441050d2d6464f5d2a31fff4fa8d3 --- /dev/null +++ b/8b7178b25b/evaluation/generation/examples.8b7178b25b_GEM-web_nlg_en_PALM_prompt_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0629d66c49c4bdfb6040b30e989a4c82468f106e021681c1b1608074b60514ff +size 5581198 diff --git a/8b7178b25b/evaluation/generation/examples.8b7178b25b_GEM-web_nlg_en_PALM_prompt_3.jsonl b/8b7178b25b/evaluation/generation/examples.8b7178b25b_GEM-web_nlg_en_PALM_prompt_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e9666896e7d0e3c591b0e400edef8debf3876299 --- /dev/null +++ b/8b7178b25b/evaluation/generation/examples.8b7178b25b_GEM-web_nlg_en_PALM_prompt_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a5f06e44ce5a0d5292167f69b5ea9341d6bdd521d6b821fc907490772fdf8c4 +size 6444573 diff --git a/8b7178b25b/evaluation/generation/examples.8b7178b25b_GEM-web_nlg_en_PALM_prompt_4.jsonl b/8b7178b25b/evaluation/generation/examples.8b7178b25b_GEM-web_nlg_en_PALM_prompt_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..fb55ac7c46a5e140ffcbc8057d9b92f32a668275 --- /dev/null +++ b/8b7178b25b/evaluation/generation/examples.8b7178b25b_GEM-web_nlg_en_PALM_prompt_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09fc8b0a1ad30d4620c312955b4b813cfdbcc6d6b3bca0f131467f71e81d6b4a +size 7305310 diff --git a/8b7178b25b/evaluation/generation/examples.8b7178b25b_GEM-web_nlg_en_PALM_prompt_5.jsonl b/8b7178b25b/evaluation/generation/examples.8b7178b25b_GEM-web_nlg_en_PALM_prompt_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..7bb3f4e7a1dd75ea6bb1283566d906945ca0180d --- /dev/null +++ b/8b7178b25b/evaluation/generation/examples.8b7178b25b_GEM-web_nlg_en_PALM_prompt_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f5c1a033d961a41e6f73fdefb253ce551eb72a132d1d91b49e79d29f5070898 +size 8160763 diff --git a/8b7178b25b/evaluation/generation/examples.8b7178b25b_GEM-wiki_lingua_en_tldr_en_0.jsonl b/8b7178b25b/evaluation/generation/examples.8b7178b25b_GEM-wiki_lingua_en_tldr_en_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..bcb0abd7bb20ffd27cca56e4168e7cab4b7d7a1c --- /dev/null +++ b/8b7178b25b/evaluation/generation/examples.8b7178b25b_GEM-wiki_lingua_en_tldr_en_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a26cd8275bb29178938176e55b6b28ef9d4eb3e3e322738cf3c5561c676499d +size 7473474 diff --git a/8b7178b25b/evaluation/generation/examples.8b7178b25b_GEM-wiki_lingua_en_tldr_en_1.jsonl b/8b7178b25b/evaluation/generation/examples.8b7178b25b_GEM-wiki_lingua_en_tldr_en_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..f17275c378c0923d6282b5c4638053c6b396cc1a --- /dev/null +++ b/8b7178b25b/evaluation/generation/examples.8b7178b25b_GEM-wiki_lingua_en_tldr_en_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9fabcd86f6e3d6ae965d311be5686c99fdcaf0349f8ce37ac6148d8cc3738ba0 +size 12934697 diff --git a/8b7178b25b/evaluation/generation/examples.8b7178b25b_GEM-wiki_lingua_en_tldr_en_2.jsonl b/8b7178b25b/evaluation/generation/examples.8b7178b25b_GEM-wiki_lingua_en_tldr_en_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/8b7178b25b/evaluation/generation/examples.8b7178b25b_GEM-wiki_lingua_en_tldr_en_3.jsonl b/8b7178b25b/evaluation/generation/examples.8b7178b25b_GEM-wiki_lingua_en_tldr_en_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/8b7178b25b/evaluation/generation/examples.8b7178b25b_GEM-wiki_lingua_en_tldr_en_4.jsonl b/8b7178b25b/evaluation/generation/examples.8b7178b25b_GEM-wiki_lingua_en_tldr_en_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/8b7178b25b/evaluation/generation/examples.8b7178b25b_GEM-wiki_lingua_en_tldr_en_5.jsonl b/8b7178b25b/evaluation/generation/examples.8b7178b25b_GEM-wiki_lingua_en_tldr_en_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/8b7178b25b/evaluation/generation/examples.8b7178b25b_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl b/8b7178b25b/evaluation/generation/examples.8b7178b25b_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..c4ba80945bb365751c58d3805c92c0a6561c5b99 --- /dev/null +++ b/8b7178b25b/evaluation/generation/examples.8b7178b25b_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:042e377741565300f5f3b1fee7bab0d6a795e88898ff638cac59c615e75ee454 +size 4370955 diff --git a/8b7178b25b/evaluation/generation/examples.8b7178b25b_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl b/8b7178b25b/evaluation/generation/examples.8b7178b25b_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..5d7d066e6d61db052a373d055996bea3132ebf7c --- /dev/null +++ b/8b7178b25b/evaluation/generation/examples.8b7178b25b_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d80417f4d0f7e96e6b204eb5d7a0337652207eb2f0afaae00d5ab82d977d8e8c +size 4993617 diff --git a/8b7178b25b/evaluation/generation/examples.8b7178b25b_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl b/8b7178b25b/evaluation/generation/examples.8b7178b25b_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..83c502cdb07aef1a4764c2d877241ac63462cc79 --- /dev/null +++ b/8b7178b25b/evaluation/generation/examples.8b7178b25b_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:015082db438de64e42e87ecb9a43f2783cf6177c1a6d987c859cd64f82220217 +size 6087012 diff --git a/8b7178b25b/evaluation/generation/examples.8b7178b25b_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl b/8b7178b25b/evaluation/generation/examples.8b7178b25b_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..7b1f2e9f59a2efbae2556a7f2619dc8cb27bf5f2 --- /dev/null +++ b/8b7178b25b/evaluation/generation/examples.8b7178b25b_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71006d431ef2ee5a581ef6bd6e86c446dd870df445222a426f2e80bdceb16aa5 +size 7174145 diff --git a/8b7178b25b/evaluation/generation/examples.8b7178b25b_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl b/8b7178b25b/evaluation/generation/examples.8b7178b25b_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..39cecb8bf7c34dfb2fc2170f0f2619ed547cb85e --- /dev/null +++ b/8b7178b25b/evaluation/generation/examples.8b7178b25b_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d91dabcfb680221adfd38c57a0a63f5bbd15c1d4c61412917a89b7034822677b +size 8257991 diff --git a/8b7178b25b/evaluation/generation/examples.8b7178b25b_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl b/8b7178b25b/evaluation/generation/examples.8b7178b25b_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..1b5d03876df7982ddca20226186dcb72733b7bed --- /dev/null +++ b/8b7178b25b/evaluation/generation/examples.8b7178b25b_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3eb99e8bcacf1cceee3459f23630184e1623d5e0c2835493389e471acb9b7e32 +size 9344420 diff --git a/8b7178b25b/evaluation/generation/examples.8b7178b25b_gem_xsum_article_DOC_summary_0.jsonl b/8b7178b25b/evaluation/generation/examples.8b7178b25b_gem_xsum_article_DOC_summary_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..aa4ba79c6a676588c2982611b238d31de8ffbf1e --- /dev/null +++ b/8b7178b25b/evaluation/generation/examples.8b7178b25b_gem_xsum_article_DOC_summary_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67cbd74998310a74d0017f07379277de7bacff9099822469958406a11163c290 +size 2794946 diff --git a/8b7178b25b/evaluation/generation/examples.8b7178b25b_gem_xsum_article_DOC_summary_1.jsonl b/8b7178b25b/evaluation/generation/examples.8b7178b25b_gem_xsum_article_DOC_summary_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..0ddac151cc2888367876d37e27fb029cbe7e2711 --- /dev/null +++ b/8b7178b25b/evaluation/generation/examples.8b7178b25b_gem_xsum_article_DOC_summary_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19d908a094bf69be6be55681f5f8c23eb19561d5248275daf0a27cd9e62090d8 +size 4940129 diff --git a/8b7178b25b/evaluation/generation/examples.8b7178b25b_gem_xsum_article_DOC_summary_2.jsonl b/8b7178b25b/evaluation/generation/examples.8b7178b25b_gem_xsum_article_DOC_summary_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..30406ee7faa3f46cd18b20eb24dc31bcdb67bd0b --- /dev/null +++ b/8b7178b25b/evaluation/generation/examples.8b7178b25b_gem_xsum_article_DOC_summary_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf2fa19fe543554a0a1ca6b84862b145bc35b02bf6c9ef7bf719d9b69eb89a78 +size 7201820 diff --git a/8b7178b25b/evaluation/generation/examples.8b7178b25b_gem_xsum_article_DOC_summary_3.jsonl b/8b7178b25b/evaluation/generation/examples.8b7178b25b_gem_xsum_article_DOC_summary_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/8b7178b25b/evaluation/generation/examples.8b7178b25b_gem_xsum_article_DOC_summary_4.jsonl b/8b7178b25b/evaluation/generation/examples.8b7178b25b_gem_xsum_article_DOC_summary_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/8b7178b25b/evaluation/generation/examples.8b7178b25b_gem_xsum_article_DOC_summary_5.jsonl b/8b7178b25b/evaluation/generation/examples.8b7178b25b_gem_xsum_article_DOC_summary_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/8b7178b25b/evaluation/generation/merged.csv b/8b7178b25b/evaluation/generation/merged.csv new file mode 100644 index 0000000000000000000000000000000000000000..34105cce50cee066f3752e3210f49a595101d540 --- /dev/null +++ b/8b7178b25b/evaluation/generation/merged.csv @@ -0,0 +1,39 @@ +dataset,fewshots,prompt,metric,value +e2e_nlg_cleaned,0,generate_text_restaurant,rouge2_fmeasure,0.046215425350075 +e2e_nlg_cleaned,0,median,rouge2_fmeasure,0.046215425350075 +e2e_nlg_cleaned,1,generate_text_restaurant,rouge2_fmeasure,0.23032000484043905 +e2e_nlg_cleaned,1,median,rouge2_fmeasure,0.23032000484043905 +e2e_nlg_cleaned,2,generate_text_restaurant,rouge2_fmeasure,0.25374280478792693 +e2e_nlg_cleaned,2,median,rouge2_fmeasure,0.25374280478792693 +e2e_nlg_cleaned,3,generate_text_restaurant,rouge2_fmeasure,0.2611392423531194 +e2e_nlg_cleaned,3,median,rouge2_fmeasure,0.2611392423531194 +e2e_nlg_cleaned,4,generate_text_restaurant,rouge2_fmeasure,0.2653610425045864 +e2e_nlg_cleaned,4,median,rouge2_fmeasure,0.2653610425045864 +e2e_nlg_cleaned,5,generate_text_restaurant,rouge2_fmeasure,0.26786622625063644 +e2e_nlg_cleaned,5,median,rouge2_fmeasure,0.26786622625063644 +e2e_nlg_cleaned,5,average,multiple,0.2207741243477972 +gem_xsum,0,article_DOC_summary,rouge2_fmeasure,0.044133865209903714 +gem_xsum,0,median,rouge2_fmeasure,0.044133865209903714 +gem_xsum,1,article_DOC_summary,rouge2_fmeasure,0.05891708042714147 +gem_xsum,1,median,rouge2_fmeasure,0.05891708042714147 +gem_xsum,2,article_DOC_summary,rouge2_fmeasure,0.06271701269177109 +gem_xsum,2,median,rouge2_fmeasure,0.06271701269177109 +gem_xsum,2,average,multiple,0.05525598610960542 +web_nlg_en,0,PALM_prompt,rouge2_fmeasure,0.04353421604632926 +web_nlg_en,0,median,rouge2_fmeasure,0.04353421604632926 +web_nlg_en,1,PALM_prompt,rouge2_fmeasure,0.07820906828691397 +web_nlg_en,1,median,rouge2_fmeasure,0.07820906828691397 +web_nlg_en,2,PALM_prompt,rouge2_fmeasure,0.1017490401630499 +web_nlg_en,2,median,rouge2_fmeasure,0.1017490401630499 +web_nlg_en,3,PALM_prompt,rouge2_fmeasure,0.11312048852329888 +web_nlg_en,3,median,rouge2_fmeasure,0.11312048852329888 +web_nlg_en,4,PALM_prompt,rouge2_fmeasure,0.12153309984630654 +web_nlg_en,4,median,rouge2_fmeasure,0.12153309984630654 +web_nlg_en,5,PALM_prompt,rouge2_fmeasure,0.13673599319945717 +web_nlg_en,5,median,rouge2_fmeasure,0.13673599319945717 +web_nlg_en,5,average,multiple,0.09914698434422596 +wiki_lingua_en,0,tldr_en,rouge2_fmeasure,0.04445750772336212 +wiki_lingua_en,0,median,rouge2_fmeasure,0.04445750772336212 +wiki_lingua_en,1,tldr_en,rouge2_fmeasure,0.053780768787129375 +wiki_lingua_en,1,median,rouge2_fmeasure,0.053780768787129375 +wiki_lingua_en,1,average,multiple,0.04911913825524575 diff --git a/8b7178b25b/evaluation/generation/merged.json b/8b7178b25b/evaluation/generation/merged.json new file mode 100644 index 0000000000000000000000000000000000000000..c00c1d8eed082bff1c15b03a9cdee95841cebfc7 --- /dev/null +++ b/8b7178b25b/evaluation/generation/merged.json @@ -0,0 +1 @@ +{"GEM/web_nlg_en": {"0": {"PALM_prompt": {"bleu": 0.33618386090404295, "bleu_stderr": 0.043286547374004225, "rouge1_fmeasure": 0.09550360928926843, "rouge1_fmeasure_stderr": 0.0021611192824620468, "rouge1_precision": 0.07608115633976532, "rouge1_precision_stderr": 0.0028424335866037475, "rouge1_recall": 0.243734587530279, "rouge1_recall_stderr": 0.005032751672173048, "rouge2_fmeasure": 0.04353421604632926, "rouge2_fmeasure_stderr": 0.0013022741040944032, "rouge2_precision": 0.03391274645846755, "rouge2_precision_stderr": 0.0017782441786429572, "rouge2_recall": 0.11477361563470867, "rouge2_recall_stderr": 0.0030177112931945443, "rougeL_fmeasure": 0.0908905716888711, "rougeL_fmeasure_stderr": 0.0019748576875776485, "rougeL_precision": 0.07249954185930807, "rougeL_precision_stderr": 0.002716866763111571, "rougeL_recall": 0.23447583587320983, "rougeL_recall_stderr": 0.004820896551192642, "rougeLsum_fmeasure": 0.09063319866429098, "rougeLsum_fmeasure_stderr": 0.002018782468480028, "rougeLsum_precision": 0.07260565563718514, "rougeLsum_precision_stderr": 0.0027622865524293628, "rougeLsum_recall": 0.2312007323793673, "rougeLsum_recall_stderr": 0.004666750865618609}}, "1": {"PALM_prompt": {"bleu": 0.5152510207869508, "bleu_stderr": 0.039697768768641464, "rouge1_fmeasure": 0.15419793855600986, "rouge1_fmeasure_stderr": 0.0037752055082234935, "rouge1_precision": 0.1335251141437586, "rouge1_precision_stderr": 0.004421796872864802, "rouge1_recall": 0.3040669240102272, "rouge1_recall_stderr": 0.0049926465687368735, "rouge2_fmeasure": 0.07820906828691397, "rouge2_fmeasure_stderr": 0.0026222161094111586, "rouge2_precision": 0.06857339375782437, "rouge2_precision_stderr": 0.0030273264083127568, "rouge2_recall": 0.1555986112064758, "rouge2_recall_stderr": 0.0036341014671041087, "rougeL_fmeasure": 0.13965714245032726, "rougeL_fmeasure_stderr": 0.0032487392690607572, "rougeL_precision": 0.1195649771956543, "rougeL_precision_stderr": 0.0038518942294089972, "rougeL_recall": 0.2838951533263151, "rougeL_recall_stderr": 0.004599064364517073, "rougeLsum_fmeasure": 0.14150307262693815, "rougeLsum_fmeasure_stderr": 0.0033007395324502467, "rougeLsum_precision": 0.12140487798820795, "rougeLsum_precision_stderr": 0.003915984273012587, "rougeLsum_recall": 0.2857833042522088, "rougeLsum_recall_stderr": 0.004601461544101827}}, "2": {"PALM_prompt": {"bleu": 0.6450721424031474, "bleu_stderr": 0.035938592978876936, "rouge1_fmeasure": 0.19228537050298922, "rouge1_fmeasure_stderr": 0.004356183491682661, "rouge1_precision": 0.17715496451419446, "rouge1_precision_stderr": 0.005377686826508908, "rouge1_recall": 0.3442204927205235, "rouge1_recall_stderr": 0.00499209962075588, "rouge2_fmeasure": 0.1017490401630499, "rouge2_fmeasure_stderr": 0.003080557280075834, "rouge2_precision": 0.09659406582034752, "rouge2_precision_stderr": 0.0036720254666308344, "rouge2_recall": 0.1816245156374427, "rouge2_recall_stderr": 0.0038421174433974025, "rougeL_fmeasure": 0.17158392384169643, "rougeL_fmeasure_stderr": 0.0037128302671958994, "rougeL_precision": 0.15519367504713033, "rougeL_precision_stderr": 0.004580706449804959, "rougeL_recall": 0.31893881029765586, "rougeL_recall_stderr": 0.004597766706728441, "rougeLsum_fmeasure": 0.17498254398589475, "rougeLsum_fmeasure_stderr": 0.0037985612156152086, "rougeLsum_precision": 0.1592800915810083, "rougeLsum_precision_stderr": 0.0047149524911017215, "rougeLsum_recall": 0.3221825821541532, "rougeLsum_recall_stderr": 0.0046252310161258746}}, "3": {"PALM_prompt": {"bleu": 0.8785043636862591, "bleu_stderr": 0.02652000083973547, "rouge1_fmeasure": 0.21217682060449367, "rouge1_fmeasure_stderr": 0.004581243352642801, "rouge1_precision": 0.2002191357399255, "rouge1_precision_stderr": 0.005700191155087746, "rouge1_recall": 0.3622650735119951, "rouge1_recall_stderr": 0.005105318033672305, "rouge2_fmeasure": 0.11312048852329888, "rouge2_fmeasure_stderr": 0.003186877123824252, "rouge2_precision": 0.10955905558045385, "rouge2_precision_stderr": 0.0038849982073218873, "rouge2_recall": 0.19262377036723086, "rouge2_recall_stderr": 0.003902442560309681, "rougeL_fmeasure": 0.1874319081280966, "rougeL_fmeasure_stderr": 0.0038899168243038715, "rougeL_precision": 0.1744946205047383, "rougeL_precision_stderr": 0.004899868234689971, "rougeL_recall": 0.33190561350734876, "rougeL_recall_stderr": 0.004628476785750535, "rougeLsum_fmeasure": 0.19207381785134825, "rougeLsum_fmeasure_stderr": 0.004003703743860644, "rougeLsum_precision": 0.17972186968155374, "rougeLsum_precision_stderr": 0.005058207025529124, "rougeLsum_recall": 0.33723235220496645, "rougeLsum_recall_stderr": 0.0046889691038068775}}, "4": {"PALM_prompt": {"bleu": 1.020225734756704, "bleu_stderr": 0.06946466420275214, "rouge1_fmeasure": 0.22615455778377724, "rouge1_fmeasure_stderr": 0.004584303113870005, "rouge1_precision": 0.21447559212644274, "rouge1_precision_stderr": 0.005787602630220149, "rouge1_recall": 0.3797811786576114, "rouge1_recall_stderr": 0.005078572769442694, "rouge2_fmeasure": 0.12153309984630654, "rouge2_fmeasure_stderr": 0.0032009564132827184, "rouge2_precision": 0.11802182161980528, "rouge2_precision_stderr": 0.003954053081043237, "rouge2_recall": 0.20495230642568182, "rouge2_recall_stderr": 0.003956396099130858, "rougeL_fmeasure": 0.1985084531863174, "rougeL_fmeasure_stderr": 0.003863020108912202, "rougeL_precision": 0.18574729294363898, "rougeL_precision_stderr": 0.00493965653212434, "rougeL_recall": 0.34661430398431914, "rougeL_recall_stderr": 0.004643977843173891, "rougeLsum_fmeasure": 0.20493355705865743, "rougeLsum_fmeasure_stderr": 0.004011218572127487, "rougeLsum_precision": 0.19295820334137398, "rougeLsum_precision_stderr": 0.005149923293184489, "rougeLsum_recall": 0.3532599821115898, "rougeLsum_recall_stderr": 0.004685486372918684}}, "5": {"PALM_prompt": {"bleu": 1.1738991703843653, "bleu_stderr": 0.05137420728965795, "rouge1_fmeasure": 0.2452749113827306, "rouge1_fmeasure_stderr": 0.004866057995099286, "rouge1_precision": 0.23842752486609714, "rouge1_precision_stderr": 0.00616558462817229, "rouge1_recall": 0.39104608539227964, "rouge1_recall_stderr": 0.005079097315439687, "rouge2_fmeasure": 0.13673599319945717, "rouge2_fmeasure_stderr": 0.003545382189555846, "rouge2_precision": 0.13743673376990653, "rouge2_precision_stderr": 0.004448566773563913, "rouge2_recall": 0.21617363071605727, "rouge2_recall_stderr": 0.004065117072186819, "rougeL_fmeasure": 0.2145149869812429, "rougeL_fmeasure_stderr": 0.004135695136449003, "rougeL_precision": 0.20669362004199143, "rougeL_precision_stderr": 0.0053303444381744315, "rougeL_recall": 0.35345362943589836, "rougeL_recall_stderr": 0.004581784867877382, "rougeLsum_fmeasure": 0.22169261840373009, "rougeLsum_fmeasure_stderr": 0.004292938565416988, "rougeLsum_precision": 0.21482050441032427, "rougeLsum_precision_stderr": 0.005549487778372521, "rougeLsum_recall": 0.3612051449037077, "rougeLsum_recall_stderr": 0.004657096205531439}}}, "GEM/wiki_lingua_en": {"0": {"tldr_en": {"bleu": 3.2204812581094187, "bleu_stderr": 0.0968937530189579, "rouge1_fmeasure": 0.17281704832161807, "rouge1_fmeasure_stderr": 0.0025639705499622615, "rouge1_precision": 0.16222110345712215, "rouge1_precision_stderr": 0.002918181626000938, "rouge1_recall": 0.23556142979563985, "rouge1_recall_stderr": 0.0035092798940514463, "rouge2_fmeasure": 0.04445750772336212, "rouge2_fmeasure_stderr": 0.0010694173040695087, "rouge2_precision": 0.04035916262517482, "rouge2_precision_stderr": 0.0011089852877097363, "rouge2_recall": 0.06187933259063034, "rouge2_recall_stderr": 0.0015927286355937283, "rougeL_fmeasure": 0.12828595447707558, "rougeL_fmeasure_stderr": 0.0018630698897748783, "rougeL_precision": 0.12115800294799915, "rougeL_precision_stderr": 0.0023302786580353405, "rougeL_recall": 0.1793437869920672, "rougeL_recall_stderr": 0.0027904364481447434, "rougeLsum_fmeasure": 0.16125234602130137, "rougeLsum_fmeasure_stderr": 0.0024054029356366125, "rougeLsum_precision": 0.15193645088089489, "rougeLsum_precision_stderr": 0.002794596188541928, "rougeLsum_recall": 0.22017606445792967, "rougeLsum_recall_stderr": 0.003307741344782461}}, "1": {"tldr_en": {"bleu": 3.030764799858383, "bleu_stderr": 0.10180137949258324, "rouge1_fmeasure": 0.20057722026752264, "rouge1_fmeasure_stderr": 0.00237727127672953, "rouge1_precision": 0.24835405674131716, "rouge1_precision_stderr": 0.003595946507957674, "rouge1_recall": 0.22065222520601965, "rouge1_recall_stderr": 0.0030326234032250735, "rouge2_fmeasure": 0.053780768787129375, "rouge2_fmeasure_stderr": 0.0012652221510456923, "rouge2_precision": 0.07072572329707479, "rouge2_precision_stderr": 0.002023483136430399, "rouge2_recall": 0.05888749376061464, "rouge2_recall_stderr": 0.0015271270172799948, "rougeL_fmeasure": 0.15099195793433165, "rougeL_fmeasure_stderr": 0.0017939149386485946, "rougeL_precision": 0.18962847615836217, "rougeL_precision_stderr": 0.0029056148560385174, "rougeL_recall": 0.16669593752772216, "rougeL_recall_stderr": 0.0023452388157941375, "rougeLsum_fmeasure": 0.18619742012806825, "rougeLsum_fmeasure_stderr": 0.0022080861119325576, "rougeLsum_precision": 0.23119707647225618, "rougeLsum_precision_stderr": 0.0034029730598757074, "rougeLsum_recall": 0.20514467867088854, "rougeLsum_recall_stderr": 0.0028358663517956315}}}, "e2e_nlg_cleaned": {"0": {"generate_text_restaurant": {"bleu": 1.8080075016885704, "bleu_stderr": 0.061027545228237855, "rouge1_fmeasure": 0.17861979049522314, "rouge1_fmeasure_stderr": 0.0018002125016461491, "rouge1_precision": 0.1356910382997071, "rouge1_precision_stderr": 0.0015410643240858764, "rouge1_recall": 0.2778453886224831, "rouge1_recall_stderr": 0.0023539268248121705, "rouge2_fmeasure": 0.046215425350075, "rouge2_fmeasure_stderr": 0.0010566397123776003, "rouge2_precision": 0.03490809623131593, "rouge2_precision_stderr": 0.0008357898041576343, "rouge2_recall": 0.07284634942140401, "rouge2_recall_stderr": 0.0015701168954429102, "rougeL_fmeasure": 0.16201597249905292, "rougeL_fmeasure_stderr": 0.0013971090679042123, "rougeL_precision": 0.12227403244327856, "rougeL_precision_stderr": 0.0011855454993101654, "rougeL_recall": 0.2551033251187225, "rougeL_recall_stderr": 0.0019031145709281366, "rougeLsum_fmeasure": 0.14908466648922475, "rougeLsum_fmeasure_stderr": 0.0016626826909044133, "rougeLsum_precision": 0.113242028542405, "rougeLsum_precision_stderr": 0.0013998996791185847, "rougeLsum_recall": 0.23203443734017606, "rougeLsum_recall_stderr": 0.0022390418934348437}}, "1": {"generate_text_restaurant": {"bleu": 12.173849341913149, "bleu_stderr": 0.0669092468478733, "rouge1_fmeasure": 0.48129644782721304, "rouge1_fmeasure_stderr": 0.0023219173855042303, "rouge1_precision": 0.5970385739901486, "rouge1_precision_stderr": 0.003272991717133695, "rouge1_recall": 0.44205108840831364, "rouge1_recall_stderr": 0.002990943407358534, "rouge2_fmeasure": 0.23032000484043905, "rouge2_fmeasure_stderr": 0.0021147211593944798, "rouge2_precision": 0.2911262146867607, "rouge2_precision_stderr": 0.002892523328423528, "rouge2_recall": 0.2107609477318019, "rouge2_recall_stderr": 0.0022166981158979714, "rougeL_fmeasure": 0.34966965256911114, "rougeL_fmeasure_stderr": 0.002108342891501849, "rougeL_precision": 0.4377488624210833, "rougeL_precision_stderr": 0.003110832463080634, "rougeL_recall": 0.3198170788492075, "rougeL_recall_stderr": 0.002444190246186975, "rougeLsum_fmeasure": 0.39331173897680705, "rougeLsum_fmeasure_stderr": 0.0023364505709058668, "rougeLsum_precision": 0.48957738460024036, "rougeLsum_precision_stderr": 0.00327157474691632, "rougeLsum_recall": 0.36068779636155734, "rougeLsum_recall_stderr": 0.0027524175233159713}}, "2": {"generate_text_restaurant": {"bleu": 14.360624153571306, "bleu_stderr": 0.15724700369597677, "rouge1_fmeasure": 0.5041317140273615, "rouge1_fmeasure_stderr": 0.0022753134233410278, "rouge1_precision": 0.6032331597687249, "rouge1_precision_stderr": 0.003142877448057622, "rouge1_recall": 0.4697575589134947, "rouge1_recall_stderr": 0.0029526957130554953, "rouge2_fmeasure": 0.25374280478792693, "rouge2_fmeasure_stderr": 0.002169411661246531, "rouge2_precision": 0.30851618494266825, "rouge2_precision_stderr": 0.002855313490834544, "rouge2_recall": 0.23616858770973606, "rouge2_recall_stderr": 0.002325964607821345, "rougeL_fmeasure": 0.3721296496966484, "rougeL_fmeasure_stderr": 0.002164018647000424, "rougeL_precision": 0.4477614821909179, "rougeL_precision_stderr": 0.003011118677636196, "rougeL_recall": 0.3459816794847227, "rougeL_recall_stderr": 0.002532543665969986, "rougeLsum_fmeasure": 0.42160904040581204, "rougeLsum_fmeasure_stderr": 0.002384317338752149, "rougeLsum_precision": 0.5054563233222107, "rougeLsum_precision_stderr": 0.0032185989379280733, "rougeLsum_recall": 0.39233324008569126, "rougeLsum_recall_stderr": 0.0027964602331100393}}, "3": {"generate_text_restaurant": {"bleu": 15.173778916293744, "bleu_stderr": 0.24020125390484678, "rouge1_fmeasure": 0.5122282123885756, "rouge1_fmeasure_stderr": 0.0022794016747342454, "rouge1_precision": 0.6038782195503243, "rouge1_precision_stderr": 0.003130218028564903, "rouge1_recall": 0.4797961783746489, "rouge1_recall_stderr": 0.0029264432136497623, "rouge2_fmeasure": 0.2611392423531194, "rouge2_fmeasure_stderr": 0.0021928684064362373, "rouge2_precision": 0.31128306325561933, "rouge2_precision_stderr": 0.0028044649859898306, "rouge2_recall": 0.2447494516430458, "rouge2_recall_stderr": 0.002368198668181156, "rougeL_fmeasure": 0.37928627551530325, "rougeL_fmeasure_stderr": 0.0021871071072142663, "rougeL_precision": 0.44868202075612884, "rougeL_precision_stderr": 0.0029681578589764264, "rougeL_recall": 0.35482043982343436, "rougeL_recall_stderr": 0.002532913929369527, "rougeLsum_fmeasure": 0.43123333798993546, "rougeLsum_fmeasure_stderr": 0.002401597688343299, "rougeLsum_precision": 0.5087702457406414, "rougeLsum_precision_stderr": 0.0031818356512290486, "rougeLsum_recall": 0.4036850753818513, "rougeLsum_recall_stderr": 0.0028061971662930287}}, "4": {"generate_text_restaurant": {"bleu": 15.78836334652692, "bleu_stderr": 0.16277087917874616, "rouge1_fmeasure": 0.5201963806927633, "rouge1_fmeasure_stderr": 0.0022664890545995124, "rouge1_precision": 0.6052306848983445, "rouge1_precision_stderr": 0.0031205758451821283, "rouge1_recall": 0.49015291142822803, "rouge1_recall_stderr": 0.002870806275113502, "rouge2_fmeasure": 0.2653610425045864, "rouge2_fmeasure_stderr": 0.0021838284720614534, "rouge2_precision": 0.31194428367362853, "rouge2_precision_stderr": 0.0027609843407215874, "rouge2_recall": 0.2500276639929066, "rouge2_recall_stderr": 0.0023425058959290804, "rougeL_fmeasure": 0.3838642484464721, "rougeL_fmeasure_stderr": 0.002185515405072229, "rougeL_precision": 0.4475978408946653, "rougeL_precision_stderr": 0.002901824428209634, "rougeL_recall": 0.36147111146407906, "rougeL_recall_stderr": 0.002523200720958866, "rougeLsum_fmeasure": 0.43919378367441203, "rougeLsum_fmeasure_stderr": 0.002408659068024605, "rougeLsum_precision": 0.5110579537103325, "rougeLsum_precision_stderr": 0.0031404148777386892, "rougeLsum_recall": 0.4135967411759738, "rougeLsum_recall_stderr": 0.0027946622087117543}}, "5": {"generate_text_restaurant": {"bleu": 15.879323420491742, "bleu_stderr": 0.1522927233333457, "rouge1_fmeasure": 0.5216373530710218, "rouge1_fmeasure_stderr": 0.002262224044659468, "rouge1_precision": 0.6064323245894362, "rouge1_precision_stderr": 0.00315510278665659, "rouge1_recall": 0.49013366730559393, "rouge1_recall_stderr": 0.0028136604439425025, "rouge2_fmeasure": 0.26786622625063644, "rouge2_fmeasure_stderr": 0.002208434520877025, "rouge2_precision": 0.3150817079641561, "rouge2_precision_stderr": 0.002829192112850875, "rouge2_recall": 0.25132514912770915, "rouge2_recall_stderr": 0.002318826430015561, "rougeL_fmeasure": 0.38681699896646954, "rougeL_fmeasure_stderr": 0.002220989687079745, "rougeL_precision": 0.45023806138186195, "rougeL_precision_stderr": 0.002949168521598567, "rougeL_recall": 0.36355539000425124, "rougeL_recall_stderr": 0.002526510160020316, "rougeLsum_fmeasure": 0.4417889417099761, "rougeLsum_fmeasure_stderr": 0.0024158193931717187, "rougeLsum_precision": 0.5137337228447252, "rougeLsum_precision_stderr": 0.0031936836223124105, "rougeLsum_recall": 0.41496788459604567, "rougeLsum_recall_stderr": 0.0027605438893900454}}}, "gem_xsum": {"0": {"article_DOC_summary": {"bleu": 1.9472662234201847, "bleu_stderr": 0.0954010664780363, "rouge1_fmeasure": 0.20062931818668506, "rouge1_fmeasure_stderr": 0.002892087092668822, "rouge1_precision": 0.1512189693389312, "rouge1_precision_stderr": 0.002590198483449934, "rouge1_recall": 0.32951007687075756, "rouge1_recall_stderr": 0.004923756202298708, "rouge2_fmeasure": 0.044133865209903714, "rouge2_fmeasure_stderr": 0.0015693045278532822, "rouge2_precision": 0.03240083882273609, "rouge2_precision_stderr": 0.0011887319293568278, "rouge2_recall": 0.07461053739480651, "rouge2_recall_stderr": 0.0027791525130900266, "rougeL_fmeasure": 0.14533977808404885, "rougeL_fmeasure_stderr": 0.0021630231020242576, "rougeL_precision": 0.11056422701824653, "rougeL_precision_stderr": 0.0021853162208514175, "rougeL_recall": 0.23921769394978765, "rougeL_recall_stderr": 0.003783594428094317, "rougeLsum_fmeasure": 0.15912733837926105, "rougeLsum_fmeasure_stderr": 0.0023937408312475765, "rougeLsum_precision": 0.12055829236568064, "rougeLsum_precision_stderr": 0.002297890666943901, "rougeLsum_recall": 0.2623026232832005, "rougeLsum_recall_stderr": 0.004182995633448934}}, "1": {"article_DOC_summary": {"bleu": 2.857997728240847, "bleu_stderr": 0.15132505328438867, "rouge1_fmeasure": 0.24058051563117627, "rouge1_fmeasure_stderr": 0.003619950901783304, "rouge1_precision": 0.2431489069099882, "rouge1_precision_stderr": 0.004319149380207122, "rouge1_recall": 0.27274551008869324, "rouge1_recall_stderr": 0.004181125297952178, "rouge2_fmeasure": 0.05891708042714147, "rouge2_fmeasure_stderr": 0.002369248568269019, "rouge2_precision": 0.06156338993755893, "rouge2_precision_stderr": 0.0027090151794028584, "rouge2_recall": 0.06564279411701872, "rouge2_recall_stderr": 0.0026141410795920464, "rougeL_fmeasure": 0.1845786738464429, "rougeL_fmeasure_stderr": 0.0030093215424524295, "rougeL_precision": 0.18703509762652787, "rougeL_precision_stderr": 0.0036036431129194833, "rougeL_recall": 0.20956010556672522, "rougeL_recall_stderr": 0.00345405751329193, "rougeLsum_fmeasure": 0.18768186260751757, "rougeLsum_fmeasure_stderr": 0.003017598467168456, "rougeLsum_precision": 0.18954846036997042, "rougeLsum_precision_stderr": 0.0035941447605698394, "rougeLsum_recall": 0.21418956311713871, "rougeLsum_recall_stderr": 0.0035468160066617596}}, "2": {"article_DOC_summary": {"bleu": 3.19195992073562, "bleu_stderr": 0.2067955639958893, "rouge1_fmeasure": 0.24657160673903905, "rouge1_fmeasure_stderr": 0.0037739176215048444, "rouge1_precision": 0.25234682823435783, "rouge1_precision_stderr": 0.004406932928762655, "rouge1_recall": 0.26739840698638306, "rouge1_recall_stderr": 0.0039999072862688684, "rouge2_fmeasure": 0.06271701269177109, "rouge2_fmeasure_stderr": 0.0025663699767628305, "rouge2_precision": 0.06567480327233229, "rouge2_precision_stderr": 0.0027842377535723913, "rouge2_recall": 0.06599412859644187, "rouge2_recall_stderr": 0.0026775951767211374, "rougeL_fmeasure": 0.1876781101224112, "rougeL_fmeasure_stderr": 0.0031437463539169125, "rougeL_precision": 0.1921361411782326, "rougeL_precision_stderr": 0.0036263536814562453, "rougeL_recall": 0.20386135964058816, "rougeL_recall_stderr": 0.0033147209011893724, "rougeLsum_fmeasure": 0.1896272533115015, "rougeLsum_fmeasure_stderr": 0.0031550558124475133, "rougeLsum_precision": 0.19374913452852363, "rougeLsum_precision_stderr": 0.0036251531161871544, "rougeLsum_recall": 0.20676693183261305, "rougeLsum_recall_stderr": 0.0034014354284824795}}}} \ No newline at end of file diff --git a/8b7178b25b/evaluation/generation/slim.8b7178b25b_GEM-web_nlg_en_PALM_prompt_0.json b/8b7178b25b/evaluation/generation/slim.8b7178b25b_GEM-web_nlg_en_PALM_prompt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..1df9ab49557c843eaa89dc58a8fca29b5185f9e7 --- /dev/null +++ b/8b7178b25b/evaluation/generation/slim.8b7178b25b_GEM-web_nlg_en_PALM_prompt_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.33618386090404295, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.043286547374004225 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07608115633976532, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0028424335866037475 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.243734587530279, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005032751672173048 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.09550360928926843, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0021611192824620468 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03391274645846755, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0017782441786429572 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.11477361563470867, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0030177112931945443 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.04353421604632926, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0013022741040944032 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.07249954185930807, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.002716866763111571 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.23447583587320983, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004820896551192642 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.0908905716888711, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0019748576875776485 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.07260565563718514, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0027622865524293628 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.2312007323793673, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004666750865618609 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.09063319866429098, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.002018782468480028 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b25b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b25b/evaluation/generation/slim.8b7178b25b_GEM-web_nlg_en_PALM_prompt_1.json b/8b7178b25b/evaluation/generation/slim.8b7178b25b_GEM-web_nlg_en_PALM_prompt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..bd21cf4f6c622481225f49b9717f239b154dce0b --- /dev/null +++ b/8b7178b25b/evaluation/generation/slim.8b7178b25b_GEM-web_nlg_en_PALM_prompt_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.5152510207869508, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.039697768768641464 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.1335251141437586, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.004421796872864802 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.3040669240102272, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0049926465687368735 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.15419793855600986, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0037752055082234935 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.06857339375782437, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0030273264083127568 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.1555986112064758, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0036341014671041087 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.07820906828691397, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0026222161094111586 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.1195649771956543, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0038518942294089972 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.2838951533263151, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004599064364517073 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.13965714245032726, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0032487392690607572 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.12140487798820795, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.003915984273012587 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.2857833042522088, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004601461544101827 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.14150307262693815, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0033007395324502467 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b25b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b25b/evaluation/generation/slim.8b7178b25b_GEM-web_nlg_en_PALM_prompt_2.json b/8b7178b25b/evaluation/generation/slim.8b7178b25b_GEM-web_nlg_en_PALM_prompt_2.json new file mode 100644 index 0000000000000000000000000000000000000000..59bbb0e618f7d1aad0779a4123beaaa1e95cb482 --- /dev/null +++ b/8b7178b25b/evaluation/generation/slim.8b7178b25b_GEM-web_nlg_en_PALM_prompt_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.6450721424031474, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.035938592978876936 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.17715496451419446, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.005377686826508908 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.3442204927205235, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.00499209962075588 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.19228537050298922, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.004356183491682661 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.09659406582034752, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0036720254666308344 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.1816245156374427, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0038421174433974025 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.1017490401630499, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.003080557280075834 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.15519367504713033, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.004580706449804959 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.31893881029765586, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004597766706728441 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.17158392384169643, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0037128302671958994 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.1592800915810083, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0047149524911017215 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.3221825821541532, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0046252310161258746 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.17498254398589475, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0037985612156152086 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b25b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b25b/evaluation/generation/slim.8b7178b25b_GEM-web_nlg_en_PALM_prompt_3.json b/8b7178b25b/evaluation/generation/slim.8b7178b25b_GEM-web_nlg_en_PALM_prompt_3.json new file mode 100644 index 0000000000000000000000000000000000000000..0da7923ca522cffb7cedea9300b0214712cedb75 --- /dev/null +++ b/8b7178b25b/evaluation/generation/slim.8b7178b25b_GEM-web_nlg_en_PALM_prompt_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.8785043636862591, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.02652000083973547 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.2002191357399255, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.005700191155087746 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.3622650735119951, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005105318033672305 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.21217682060449367, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.004581243352642801 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.10955905558045385, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0038849982073218873 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.19262377036723086, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003902442560309681 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.11312048852329888, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.003186877123824252 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.1744946205047383, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.004899868234689971 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.33190561350734876, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004628476785750535 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.1874319081280966, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0038899168243038715 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.17972186968155374, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.005058207025529124 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.33723235220496645, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0046889691038068775 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.19207381785134825, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.004003703743860644 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b25b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b25b/evaluation/generation/slim.8b7178b25b_GEM-web_nlg_en_PALM_prompt_4.json b/8b7178b25b/evaluation/generation/slim.8b7178b25b_GEM-web_nlg_en_PALM_prompt_4.json new file mode 100644 index 0000000000000000000000000000000000000000..d4a7df7e0881a902d135c6fb4b3fd1fc2cfa9dfd --- /dev/null +++ b/8b7178b25b/evaluation/generation/slim.8b7178b25b_GEM-web_nlg_en_PALM_prompt_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 1.020225734756704, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.06946466420275214 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.21447559212644274, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.005787602630220149 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.3797811786576114, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005078572769442694 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.22615455778377724, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.004584303113870005 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.11802182161980528, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.003954053081043237 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.20495230642568182, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003956396099130858 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.12153309984630654, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0032009564132827184 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.18574729294363898, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.00493965653212434 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.34661430398431914, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004643977843173891 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.1985084531863174, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.003863020108912202 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.19295820334137398, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.005149923293184489 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.3532599821115898, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004685486372918684 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.20493355705865743, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.004011218572127487 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b25b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b25b/evaluation/generation/slim.8b7178b25b_GEM-web_nlg_en_PALM_prompt_5.json b/8b7178b25b/evaluation/generation/slim.8b7178b25b_GEM-web_nlg_en_PALM_prompt_5.json new file mode 100644 index 0000000000000000000000000000000000000000..77472f1318e983af416ebd801d407f16bbab0496 --- /dev/null +++ b/8b7178b25b/evaluation/generation/slim.8b7178b25b_GEM-web_nlg_en_PALM_prompt_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 1.1738991703843653, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.05137420728965795 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.23842752486609714, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.00616558462817229 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.39104608539227964, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005079097315439687 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.2452749113827306, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.004866057995099286 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.13743673376990653, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.004448566773563913 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.21617363071605727, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.004065117072186819 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.13673599319945717, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.003545382189555846 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.20669362004199143, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0053303444381744315 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.35345362943589836, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004581784867877382 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.2145149869812429, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.004135695136449003 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.21482050441032427, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.005549487778372521 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.3612051449037077, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004657096205531439 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.22169261840373009, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.004292938565416988 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b25b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b25b/evaluation/generation/slim.8b7178b25b_GEM-wiki_lingua_en_tldr_en_0.json b/8b7178b25b/evaluation/generation/slim.8b7178b25b_GEM-wiki_lingua_en_tldr_en_0.json new file mode 100644 index 0000000000000000000000000000000000000000..0b77d2da90675cf88274d257c6c46f77f682493a --- /dev/null +++ b/8b7178b25b/evaluation/generation/slim.8b7178b25b_GEM-wiki_lingua_en_tldr_en_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.16222110345712215, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.002918181626000938 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.23556142979563985, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0035092798940514463 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.17281704832161807, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0025639705499622615 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.04035916262517482, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0011089852877097363 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.06187933259063034, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0015927286355937283 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.04445750772336212, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0010694173040695087 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.12115800294799915, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0023302786580353405 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.1793437869920672, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0027904364481447434 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.12828595447707558, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0018630698897748783 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.15193645088089489, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.002794596188541928 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.22017606445792967, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.003307741344782461 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.16125234602130137, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0024054029356366125 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 3.2204812581094187, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.0968937530189579 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b25b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b25b/evaluation/generation/slim.8b7178b25b_GEM-wiki_lingua_en_tldr_en_1.json b/8b7178b25b/evaluation/generation/slim.8b7178b25b_GEM-wiki_lingua_en_tldr_en_1.json new file mode 100644 index 0000000000000000000000000000000000000000..216776f42321642f1ae7590f989d96a1e70eb230 --- /dev/null +++ b/8b7178b25b/evaluation/generation/slim.8b7178b25b_GEM-wiki_lingua_en_tldr_en_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.24835405674131716, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.003595946507957674 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.22065222520601965, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0030326234032250735 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.20057722026752264, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.00237727127672953 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.07072572329707479, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.002023483136430399 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.05888749376061464, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0015271270172799948 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.053780768787129375, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0012652221510456923 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.18962847615836217, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0029056148560385174 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.16669593752772216, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0023452388157941375 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.15099195793433165, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0017939149386485946 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.23119707647225618, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0034029730598757074 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.20514467867088854, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0028358663517956315 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.18619742012806825, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0022080861119325576 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 3.030764799858383, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.10180137949258324 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b25b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b25b/evaluation/generation/slim.8b7178b25b_e2e_nlg_cleaned_generate_text_restaurant_0.json b/8b7178b25b/evaluation/generation/slim.8b7178b25b_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..62be1d27f4fabbb54ce6ad71f2d975b126c5d6a1 --- /dev/null +++ b/8b7178b25b/evaluation/generation/slim.8b7178b25b_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 1.8080075016885704, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.061027545228237855 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.1356910382997071, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0015410643240858764 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.2778453886224831, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0023539268248121705 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.17861979049522314, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0018002125016461491 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.03490809623131593, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0008357898041576343 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.07284634942140401, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0015701168954429102 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.046215425350075, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0010566397123776003 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.12227403244327856, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0011855454993101654 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.2551033251187225, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0019031145709281366 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.16201597249905292, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0013971090679042123 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.113242028542405, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0013998996791185847 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.23203443734017606, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0022390418934348437 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.14908466648922475, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0016626826909044133 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b25b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b25b/evaluation/generation/slim.8b7178b25b_e2e_nlg_cleaned_generate_text_restaurant_1.json b/8b7178b25b/evaluation/generation/slim.8b7178b25b_e2e_nlg_cleaned_generate_text_restaurant_1.json new file mode 100644 index 0000000000000000000000000000000000000000..18574c404751793f6e2ec2a98ad4d29ca19525f3 --- /dev/null +++ b/8b7178b25b/evaluation/generation/slim.8b7178b25b_e2e_nlg_cleaned_generate_text_restaurant_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 12.173849341913149, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.0669092468478733 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.5970385739901486, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.003272991717133695 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.44205108840831364, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.002990943407358534 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.48129644782721304, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0023219173855042303 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.2911262146867607, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.002892523328423528 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.2107609477318019, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0022166981158979714 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.23032000484043905, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0021147211593944798 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.4377488624210833, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.003110832463080634 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3198170788492075, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.002444190246186975 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.34966965256911114, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.002108342891501849 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.48957738460024036, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.00327157474691632 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.36068779636155734, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0027524175233159713 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.39331173897680705, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0023364505709058668 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b25b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b25b/evaluation/generation/slim.8b7178b25b_e2e_nlg_cleaned_generate_text_restaurant_2.json b/8b7178b25b/evaluation/generation/slim.8b7178b25b_e2e_nlg_cleaned_generate_text_restaurant_2.json new file mode 100644 index 0000000000000000000000000000000000000000..97b7313d95b7a27d9904f061cfb4968f356c46e9 --- /dev/null +++ b/8b7178b25b/evaluation/generation/slim.8b7178b25b_e2e_nlg_cleaned_generate_text_restaurant_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 14.360624153571306, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.15724700369597677 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.6032331597687249, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.003142877448057622 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4697575589134947, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0029526957130554953 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.5041317140273615, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0022753134233410278 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.30851618494266825, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.002855313490834544 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.23616858770973606, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.002325964607821345 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.25374280478792693, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.002169411661246531 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.4477614821909179, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.003011118677636196 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3459816794847227, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.002532543665969986 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.3721296496966484, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.002164018647000424 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.5054563233222107, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0032185989379280733 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.39233324008569126, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0027964602331100393 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.42160904040581204, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.002384317338752149 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b25b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b25b/evaluation/generation/slim.8b7178b25b_e2e_nlg_cleaned_generate_text_restaurant_3.json b/8b7178b25b/evaluation/generation/slim.8b7178b25b_e2e_nlg_cleaned_generate_text_restaurant_3.json new file mode 100644 index 0000000000000000000000000000000000000000..9bdcba7882e0bf3c8207c0d897f38e5930b9578f --- /dev/null +++ b/8b7178b25b/evaluation/generation/slim.8b7178b25b_e2e_nlg_cleaned_generate_text_restaurant_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 15.173778916293744, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.24020125390484678 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.6038782195503243, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.003130218028564903 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4797961783746489, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0029264432136497623 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.5122282123885756, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0022794016747342454 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.31128306325561933, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0028044649859898306 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.2447494516430458, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.002368198668181156 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.2611392423531194, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0021928684064362373 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.44868202075612884, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0029681578589764264 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.35482043982343436, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.002532913929369527 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.37928627551530325, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0021871071072142663 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.5087702457406414, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0031818356512290486 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.4036850753818513, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0028061971662930287 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.43123333798993546, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.002401597688343299 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b25b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b25b/evaluation/generation/slim.8b7178b25b_e2e_nlg_cleaned_generate_text_restaurant_4.json b/8b7178b25b/evaluation/generation/slim.8b7178b25b_e2e_nlg_cleaned_generate_text_restaurant_4.json new file mode 100644 index 0000000000000000000000000000000000000000..9d048e1f2605aea1ef5a337ba59806d284701f85 --- /dev/null +++ b/8b7178b25b/evaluation/generation/slim.8b7178b25b_e2e_nlg_cleaned_generate_text_restaurant_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 15.78836334652692, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.16277087917874616 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.6052306848983445, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0031205758451821283 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.49015291142822803, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.002870806275113502 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.5201963806927633, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0022664890545995124 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.31194428367362853, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0027609843407215874 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.2500276639929066, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0023425058959290804 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.2653610425045864, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0021838284720614534 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.4475978408946653, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.002901824428209634 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.36147111146407906, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.002523200720958866 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.3838642484464721, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.002185515405072229 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.5110579537103325, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0031404148777386892 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.4135967411759738, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0027946622087117543 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.43919378367441203, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.002408659068024605 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b25b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b25b/evaluation/generation/slim.8b7178b25b_e2e_nlg_cleaned_generate_text_restaurant_5.json b/8b7178b25b/evaluation/generation/slim.8b7178b25b_e2e_nlg_cleaned_generate_text_restaurant_5.json new file mode 100644 index 0000000000000000000000000000000000000000..a1585f80b3aa6187cdc65c26ec975ad8f8c7cb5e --- /dev/null +++ b/8b7178b25b/evaluation/generation/slim.8b7178b25b_e2e_nlg_cleaned_generate_text_restaurant_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 15.879323420491742, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.1522927233333457 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.6064323245894362, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.00315510278665659 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.49013366730559393, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0028136604439425025 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.5216373530710218, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.002262224044659468 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.3150817079641561, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.002829192112850875 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.25132514912770915, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.002318826430015561 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.26786622625063644, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.002208434520877025 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.45023806138186195, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.002949168521598567 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.36355539000425124, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.002526510160020316 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.38681699896646954, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.002220989687079745 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.5137337228447252, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0031936836223124105 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.41496788459604567, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0027605438893900454 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.4417889417099761, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0024158193931717187 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b25b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b25b/evaluation/generation/slim.8b7178b25b_gem_xsum_article_DOC_summary_0.json b/8b7178b25b/evaluation/generation/slim.8b7178b25b_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..69d4cb6b0992d74e1aac6255c8b67e32c48913ac --- /dev/null +++ b/8b7178b25b/evaluation/generation/slim.8b7178b25b_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.1512189693389312, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.002590198483449934 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.32951007687075756, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004923756202298708 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.20062931818668506, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.002892087092668822 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.03240083882273609, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0011887319293568278 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.07461053739480651, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0027791525130900266 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.044133865209903714, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0015693045278532822 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.11056422701824653, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0021853162208514175 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.23921769394978765, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.003783594428094317 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.14533977808404885, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0021630231020242576 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.12055829236568064, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.002297890666943901 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.2623026232832005, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.004182995633448934 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.15912733837926105, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0023937408312475765 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.9472662234201847, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.0954010664780363 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b25b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b25b/evaluation/generation/slim.8b7178b25b_gem_xsum_article_DOC_summary_1.json b/8b7178b25b/evaluation/generation/slim.8b7178b25b_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..1185f3526252e68ac6353d5229e710f7e51741b1 --- /dev/null +++ b/8b7178b25b/evaluation/generation/slim.8b7178b25b_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.2431489069099882, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.004319149380207122 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.27274551008869324, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004181125297952178 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.24058051563117627, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.003619950901783304 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.06156338993755893, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0027090151794028584 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.06564279411701872, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0026141410795920464 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.05891708042714147, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.002369248568269019 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.18703509762652787, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0036036431129194833 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.20956010556672522, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.00345405751329193 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.1845786738464429, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0030093215424524295 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.18954846036997042, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0035941447605698394 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.21418956311713871, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0035468160066617596 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.18768186260751757, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.003017598467168456 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 2.857997728240847, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.15132505328438867 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b25b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b25b/evaluation/generation/slim.8b7178b25b_gem_xsum_article_DOC_summary_2.json b/8b7178b25b/evaluation/generation/slim.8b7178b25b_gem_xsum_article_DOC_summary_2.json new file mode 100644 index 0000000000000000000000000000000000000000..d65b07bb7cc406ca24c2312fde52b397bc621673 --- /dev/null +++ b/8b7178b25b/evaluation/generation/slim.8b7178b25b_gem_xsum_article_DOC_summary_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.25234682823435783, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.004406932928762655 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.26739840698638306, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.0039999072862688684 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.24657160673903905, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0037739176215048444 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.06567480327233229, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0027842377535723913 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.06599412859644187, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0026775951767211374 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.06271701269177109, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0025663699767628305 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.1921361411782326, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0036263536814562453 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.20386135964058816, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0033147209011893724 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.1876781101224112, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0031437463539169125 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.19374913452852363, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0036251531161871544 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.20676693183261305, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0034014354284824795 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.1896272533115015, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0031550558124475133 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 3.19195992073562, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.2067955639958893 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-8b7-178b-oscar-repetitions/8b7178b25b/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/8b7178b25b/evaluation/rankeval/8b7178b25b_0.csv b/8b7178b25b/evaluation/rankeval/8b7178b25b_0.csv new file mode 100644 index 0000000000000000000000000000000000000000..c33ac0cf5ac8b489f4928d9d0b9d4657f159bcea --- /dev/null +++ b/8b7178b25b/evaluation/rankeval/8b7178b25b_0.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.338,0.014965960710224482,0 +anli_r2,acc,0.34,0.014987482264363937,0 +anli_r3,acc,0.3458333333333333,0.013736245342311012,0 +arc_challenge,acc,0.26706484641638223,0.012928933196496354,0 +arc_challenge,acc_norm,0.28668941979522183,0.013214986329274776,0 +arc_easy,acc,0.5955387205387206,0.010070746648278783,0 +arc_easy,acc_norm,0.5378787878787878,0.010230299628864806,0 +boolq,acc,0.5758409785932722,0.008643869023388128,1 +cb,acc,0.4107142857142857,0.0663363415035954,1 +cb,f1,0.2938907552569367,,1 +copa,acc,0.76,0.04292346959909283,0 +hellaswag,acc,0.44523003385779725,0.004959754882055468,0 +hellaswag,acc_norm,0.5769766978689504,0.004930293787545608,0 +piqa,acc,0.7274211099020674,0.010389256803296018,0 +piqa,acc_norm,0.7404787812840044,0.010227939888173923,0 +rte,acc,0.5523465703971119,0.02993107036293953,0 +sciq,acc,0.843,0.011510146979230196,0 +sciq,acc_norm,0.773,0.013253174964763931,0 +storycloze_2016,acc,0.6835916622127205,0.01075478009794089,0 +winogrande,acc,0.5485398579321231,0.013986110301017762,0 diff --git a/8b7178b25b/evaluation/rankeval/8b7178b25b_0.json b/8b7178b25b/evaluation/rankeval/8b7178b25b_0.json new file mode 100644 index 0000000000000000000000000000000000000000..f92b8c89526cad373dcf1b6a0bbba45240fed145 --- /dev/null +++ b/8b7178b25b/evaluation/rankeval/8b7178b25b_0.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.338, + "acc_stderr": 0.014965960710224482 + }, + "anli_r2": { + "acc": 0.34, + "acc_stderr": 0.014987482264363937 + }, + "anli_r3": { + "acc": 0.3458333333333333, + "acc_stderr": 0.013736245342311012 + }, + "cb": { + "acc": 0.4107142857142857, + "acc_stderr": 0.0663363415035954, + "f1": 0.2938907552569367 + }, + "copa": { + "acc": 0.76, + "acc_stderr": 0.04292346959909283 + }, + "hellaswag": { + "acc": 0.44523003385779725, + "acc_stderr": 0.004959754882055468, + "acc_norm": 0.5769766978689504, + "acc_norm_stderr": 0.004930293787545608 + }, + "rte": { + "acc": 0.5523465703971119, + "acc_stderr": 0.02993107036293953 + }, + "winogrande": { + "acc": 0.5485398579321231, + "acc_stderr": 0.013986110301017762 + }, + "storycloze_2016": { + "acc": 0.6835916622127205, + "acc_stderr": 0.01075478009794089 + }, + "boolq": { + "acc": 0.5758409785932722, + "acc_stderr": 0.008643869023388128 + }, + "arc_easy": { + "acc": 0.5955387205387206, + "acc_stderr": 0.010070746648278783, + "acc_norm": 0.5378787878787878, + "acc_norm_stderr": 0.010230299628864806 + }, + "arc_challenge": { + "acc": 0.26706484641638223, + "acc_stderr": 0.012928933196496354, + "acc_norm": 0.28668941979522183, + "acc_norm_stderr": 0.013214986329274776 + }, + "sciq": { + "acc": 0.843, + "acc_stderr": 0.011510146979230196, + "acc_norm": 0.773, + "acc_norm_stderr": 0.013253174964763931 + }, + "piqa": { + "acc": 0.7274211099020674, + "acc_stderr": 0.010389256803296018, + "acc_norm": 0.7404787812840044, + "acc_norm_stderr": 0.010227939888173923 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/8b7178b25b/evaluation/rankeval/8b7178b25b_1.csv b/8b7178b25b/evaluation/rankeval/8b7178b25b_1.csv new file mode 100644 index 0000000000000000000000000000000000000000..ea575aef16f825673da56b2aed977a0f69a87893 --- /dev/null +++ b/8b7178b25b/evaluation/rankeval/8b7178b25b_1.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.352,0.015110404505648661,0 +anli_r2,acc,0.327,0.014842213153411242,0 +anli_r3,acc,0.33,0.013579531277800925,0 +arc_challenge,acc,0.28242320819112626,0.013155456884097222,0 +arc_challenge,acc_norm,0.30716723549488056,0.013481034054980945,0 +arc_easy,acc,0.6262626262626263,0.009927267058259626,0 +arc_easy,acc_norm,0.6123737373737373,0.009997307914447608,0 +boolq,acc,0.5834862385321101,0.008622288020674008,1 +cb,acc,0.5,0.06741998624632421,1 +cb,f1,0.355846042120552,,1 +copa,acc,0.77,0.04229525846816506,0 +hellaswag,acc,0.45130452101175067,0.0049660609953150634,0 +hellaswag,acc_norm,0.5881298546106354,0.0049116598845061485,0 +piqa,acc,0.7377584330794341,0.010262502565172447,0 +piqa,acc_norm,0.7404787812840044,0.010227939888173929,0 +rte,acc,0.5306859205776173,0.030039730592197812,0 +sciq,acc,0.903,0.009363689373248123,0 +sciq,acc_norm,0.891,0.009859828407037186,0 +storycloze_2016,acc,0.6819882415820417,0.010769343495248548,0 +winogrande,acc,0.5493291239147593,0.01398392886904024,0 diff --git a/8b7178b25b/evaluation/rankeval/8b7178b25b_1.json b/8b7178b25b/evaluation/rankeval/8b7178b25b_1.json new file mode 100644 index 0000000000000000000000000000000000000000..695ed76963d86991f5b362f1b1014155dc94aceb --- /dev/null +++ b/8b7178b25b/evaluation/rankeval/8b7178b25b_1.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.352, + "acc_stderr": 0.015110404505648661 + }, + "anli_r2": { + "acc": 0.327, + "acc_stderr": 0.014842213153411242 + }, + "anli_r3": { + "acc": 0.33, + "acc_stderr": 0.013579531277800925 + }, + "cb": { + "acc": 0.5, + "acc_stderr": 0.06741998624632421, + "f1": 0.355846042120552 + }, + "copa": { + "acc": 0.77, + "acc_stderr": 0.04229525846816506 + }, + "hellaswag": { + "acc": 0.45130452101175067, + "acc_stderr": 0.0049660609953150634, + "acc_norm": 0.5881298546106354, + "acc_norm_stderr": 0.0049116598845061485 + }, + "rte": { + "acc": 0.5306859205776173, + "acc_stderr": 0.030039730592197812 + }, + "winogrande": { + "acc": 0.5493291239147593, + "acc_stderr": 0.01398392886904024 + }, + "storycloze_2016": { + "acc": 0.6819882415820417, + "acc_stderr": 0.010769343495248548 + }, + "boolq": { + "acc": 0.5834862385321101, + "acc_stderr": 0.008622288020674008 + }, + "arc_easy": { + "acc": 0.6262626262626263, + "acc_stderr": 0.009927267058259626, + "acc_norm": 0.6123737373737373, + "acc_norm_stderr": 0.009997307914447608 + }, + "arc_challenge": { + "acc": 0.28242320819112626, + "acc_stderr": 0.013155456884097222, + "acc_norm": 0.30716723549488056, + "acc_norm_stderr": 0.013481034054980945 + }, + "sciq": { + "acc": 0.903, + "acc_stderr": 0.009363689373248123, + "acc_norm": 0.891, + "acc_norm_stderr": 0.009859828407037186 + }, + "piqa": { + "acc": 0.7377584330794341, + "acc_stderr": 0.010262502565172447, + "acc_norm": 0.7404787812840044, + "acc_norm_stderr": 0.010227939888173929 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/8b7178b25b/evaluation/rankeval/8b7178b25b_2.csv b/8b7178b25b/evaluation/rankeval/8b7178b25b_2.csv new file mode 100644 index 0000000000000000000000000000000000000000..c61a413d2af8a2babd0053af2ac882cfc47733fe --- /dev/null +++ b/8b7178b25b/evaluation/rankeval/8b7178b25b_2.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.325,0.014818724459095524,0 +anli_r2,acc,0.342,0.01500870618212173,0 +anli_r3,acc,0.31666666666666665,0.013434078660827388,0 +arc_challenge,acc,0.2909556313993174,0.013273077865907578,0 +arc_challenge,acc_norm,0.3122866894197952,0.013542598541688067,0 +arc_easy,acc,0.6342592592592593,0.009882988069418822,0 +arc_easy,acc_norm,0.6186868686868687,0.009966542497171021,0 +boolq,acc,0.608868501529052,0.008535239054221166,1 +cb,acc,0.4642857142857143,0.06724777654937658,1 +cb,f1,0.3289760348583877,,1 +copa,acc,0.77,0.04229525846816506,0 +hellaswag,acc,0.45160326628161723,0.004966351835028203,0 +hellaswag,acc_norm,0.5888269269069907,0.004910409150135493,0 +piqa,acc,0.733949945593036,0.010310039263352831,0 +piqa,acc_norm,0.7486398258977149,0.010121156016819243,0 +rte,acc,0.48375451263537905,0.030080573208738064,0 +sciq,acc,0.916,0.008776162089491137,0 +sciq,acc_norm,0.915,0.008823426366942312,0 +storycloze_2016,acc,0.6953500801710315,0.010643426988646796,0 +winogrande,acc,0.5682715074980268,0.01392087211001071,0 diff --git a/8b7178b25b/evaluation/rankeval/8b7178b25b_2.json b/8b7178b25b/evaluation/rankeval/8b7178b25b_2.json new file mode 100644 index 0000000000000000000000000000000000000000..9be8222dfab0cfd7ba13c347b15deb20d60dbd08 --- /dev/null +++ b/8b7178b25b/evaluation/rankeval/8b7178b25b_2.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.325, + "acc_stderr": 0.014818724459095524 + }, + "anli_r2": { + "acc": 0.342, + "acc_stderr": 0.01500870618212173 + }, + "anli_r3": { + "acc": 0.31666666666666665, + "acc_stderr": 0.013434078660827388 + }, + "cb": { + "acc": 0.4642857142857143, + "acc_stderr": 0.06724777654937658, + "f1": 0.3289760348583877 + }, + "copa": { + "acc": 0.77, + "acc_stderr": 0.04229525846816506 + }, + "hellaswag": { + "acc": 0.45160326628161723, + "acc_stderr": 0.004966351835028203, + "acc_norm": 0.5888269269069907, + "acc_norm_stderr": 0.004910409150135493 + }, + "rte": { + "acc": 0.48375451263537905, + "acc_stderr": 0.030080573208738064 + }, + "winogrande": { + "acc": 0.5682715074980268, + "acc_stderr": 0.01392087211001071 + }, + "storycloze_2016": { + "acc": 0.6953500801710315, + "acc_stderr": 0.010643426988646796 + }, + "boolq": { + "acc": 0.608868501529052, + "acc_stderr": 0.008535239054221166 + }, + "arc_easy": { + "acc": 0.6342592592592593, + "acc_stderr": 0.009882988069418822, + "acc_norm": 0.6186868686868687, + "acc_norm_stderr": 0.009966542497171021 + }, + "arc_challenge": { + "acc": 0.2909556313993174, + "acc_stderr": 0.013273077865907578, + "acc_norm": 0.3122866894197952, + "acc_norm_stderr": 0.013542598541688067 + }, + "sciq": { + "acc": 0.916, + "acc_stderr": 0.008776162089491137, + "acc_norm": 0.915, + "acc_norm_stderr": 0.008823426366942312 + }, + "piqa": { + "acc": 0.733949945593036, + "acc_stderr": 0.010310039263352831, + "acc_norm": 0.7486398258977149, + "acc_norm_stderr": 0.010121156016819243 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/8b7178b25b/evaluation/rankeval/8b7178b25b_3.csv b/8b7178b25b/evaluation/rankeval/8b7178b25b_3.csv new file mode 100644 index 0000000000000000000000000000000000000000..c8392ed5a9cb52992a34d61ac894ddc2d15a7501 --- /dev/null +++ b/8b7178b25b/evaluation/rankeval/8b7178b25b_3.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.319,0.014746404865473474,0 +anli_r2,acc,0.343,0.015019206922356953,0 +anli_r3,acc,0.3416666666666667,0.013696658778002519,0 +arc_challenge,acc,0.29180887372013653,0.013284525292403503,0 +arc_challenge,acc_norm,0.3174061433447099,0.01360223908803817,0 +arc_easy,acc,0.6452020202020202,0.009817629113069696,0 +arc_easy,acc_norm,0.6363636363636364,0.009870849346011758,0 +boolq,acc,0.6107033639143731,0.00852801629098454,1 +cb,acc,0.5357142857142857,0.06724777654937658,1 +cb,f1,0.3757011576560449,,1 +copa,acc,0.76,0.04292346959909282,0 +hellaswag,acc,0.4500099581756622,0.004964779805180658,0 +hellaswag,acc_norm,0.5928101971718781,0.0049030666397619485,0 +piqa,acc,0.7399347116430903,0.010234893249061303,0 +piqa,acc_norm,0.7513601741022851,0.01008451123429685,0 +rte,acc,0.51985559566787,0.030072723167317177,0 +sciq,acc,0.923,0.008434580140240643,0 +sciq,acc_norm,0.915,0.00882342636694233,0 +storycloze_2016,acc,0.6990913949759487,0.010606289538707334,0 +winogrande,acc,0.5737963693764798,0.013898585965412338,0 diff --git a/8b7178b25b/evaluation/rankeval/8b7178b25b_3.json b/8b7178b25b/evaluation/rankeval/8b7178b25b_3.json new file mode 100644 index 0000000000000000000000000000000000000000..9cf8ef119fbf65a64d58f26b9b5e71c59b8a429e --- /dev/null +++ b/8b7178b25b/evaluation/rankeval/8b7178b25b_3.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.319, + "acc_stderr": 0.014746404865473474 + }, + "anli_r2": { + "acc": 0.343, + "acc_stderr": 0.015019206922356953 + }, + "anli_r3": { + "acc": 0.3416666666666667, + "acc_stderr": 0.013696658778002519 + }, + "cb": { + "acc": 0.5357142857142857, + "acc_stderr": 0.06724777654937658, + "f1": 0.3757011576560449 + }, + "copa": { + "acc": 0.76, + "acc_stderr": 0.04292346959909282 + }, + "hellaswag": { + "acc": 0.4500099581756622, + "acc_stderr": 0.004964779805180658, + "acc_norm": 0.5928101971718781, + "acc_norm_stderr": 0.0049030666397619485 + }, + "rte": { + "acc": 0.51985559566787, + "acc_stderr": 0.030072723167317177 + }, + "winogrande": { + "acc": 0.5737963693764798, + "acc_stderr": 0.013898585965412338 + }, + "storycloze_2016": { + "acc": 0.6990913949759487, + "acc_stderr": 0.010606289538707334 + }, + "boolq": { + "acc": 0.6107033639143731, + "acc_stderr": 0.00852801629098454 + }, + "arc_easy": { + "acc": 0.6452020202020202, + "acc_stderr": 0.009817629113069696, + "acc_norm": 0.6363636363636364, + "acc_norm_stderr": 0.009870849346011758 + }, + "arc_challenge": { + "acc": 0.29180887372013653, + "acc_stderr": 0.013284525292403503, + "acc_norm": 0.3174061433447099, + "acc_norm_stderr": 0.01360223908803817 + }, + "sciq": { + "acc": 0.923, + "acc_stderr": 0.008434580140240643, + "acc_norm": 0.915, + "acc_norm_stderr": 0.00882342636694233 + }, + "piqa": { + "acc": 0.7399347116430903, + "acc_stderr": 0.010234893249061303, + "acc_norm": 0.7513601741022851, + "acc_norm_stderr": 0.01008451123429685 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/8b7178b25b/evaluation/rankeval/8b7178b25b_4.csv b/8b7178b25b/evaluation/rankeval/8b7178b25b_4.csv new file mode 100644 index 0000000000000000000000000000000000000000..8375fa456448c7b9ebc691c573caeeb71452c9af --- /dev/null +++ b/8b7178b25b/evaluation/rankeval/8b7178b25b_4.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.325,0.014818724459095526,0 +anli_r2,acc,0.33,0.014876872027456738,0 +anli_r3,acc,0.32666666666666666,0.013544340907003663,0 +arc_challenge,acc,0.28754266211604096,0.013226719056266129,0 +arc_challenge,acc_norm,0.3250853242320819,0.013688147309729122,0 +arc_easy,acc,0.6376262626262627,0.009863468202583775,0 +arc_easy,acc_norm,0.6338383838383839,0.009885391390947709,0 +boolq,acc,0.6253822629969419,0.008465633983431928,1 +cb,acc,0.5714285714285714,0.06672848092813058,1 +cb,f1,0.42867867867867865,,1 +copa,acc,0.77,0.042295258468165065,0 +hellaswag,acc,0.4495120493925513,0.004964277999318813,0 +hellaswag,acc_norm,0.5978888667596096,0.004893220635011786,0 +piqa,acc,0.7383025027203483,0.010255630772708227,0 +piqa,acc_norm,0.735038084874864,0.010296557993316047,0 +rte,acc,0.5234657039711191,0.030063300411902652,0 +sciq,acc,0.926,0.008282064512704159,0 +sciq,acc_norm,0.927,0.008230354715244066,0 +storycloze_2016,acc,0.6985569214323891,0.010611646032767584,0 +winogrande,acc,0.5722178374112076,0.013905134013839951,0 diff --git a/8b7178b25b/evaluation/rankeval/8b7178b25b_4.json b/8b7178b25b/evaluation/rankeval/8b7178b25b_4.json new file mode 100644 index 0000000000000000000000000000000000000000..5eb375a5be10ac467d3a7bea072702b14ac2e7ab --- /dev/null +++ b/8b7178b25b/evaluation/rankeval/8b7178b25b_4.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.325, + "acc_stderr": 0.014818724459095526 + }, + "anli_r2": { + "acc": 0.33, + "acc_stderr": 0.014876872027456738 + }, + "anli_r3": { + "acc": 0.32666666666666666, + "acc_stderr": 0.013544340907003663 + }, + "cb": { + "acc": 0.5714285714285714, + "acc_stderr": 0.06672848092813058, + "f1": 0.42867867867867865 + }, + "copa": { + "acc": 0.77, + "acc_stderr": 0.042295258468165065 + }, + "hellaswag": { + "acc": 0.4495120493925513, + "acc_stderr": 0.004964277999318813, + "acc_norm": 0.5978888667596096, + "acc_norm_stderr": 0.004893220635011786 + }, + "rte": { + "acc": 0.5234657039711191, + "acc_stderr": 0.030063300411902652 + }, + "winogrande": { + "acc": 0.5722178374112076, + "acc_stderr": 0.013905134013839951 + }, + "storycloze_2016": { + "acc": 0.6985569214323891, + "acc_stderr": 0.010611646032767584 + }, + "boolq": { + "acc": 0.6253822629969419, + "acc_stderr": 0.008465633983431928 + }, + "arc_easy": { + "acc": 0.6376262626262627, + "acc_stderr": 0.009863468202583775, + "acc_norm": 0.6338383838383839, + "acc_norm_stderr": 0.009885391390947709 + }, + "arc_challenge": { + "acc": 0.28754266211604096, + "acc_stderr": 0.013226719056266129, + "acc_norm": 0.3250853242320819, + "acc_norm_stderr": 0.013688147309729122 + }, + "sciq": { + "acc": 0.926, + "acc_stderr": 0.008282064512704159, + "acc_norm": 0.927, + "acc_norm_stderr": 0.008230354715244066 + }, + "piqa": { + "acc": 0.7383025027203483, + "acc_stderr": 0.010255630772708227, + "acc_norm": 0.735038084874864, + "acc_norm_stderr": 0.010296557993316047 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/8b7178b25b/evaluation/rankeval/8b7178b25b_5.csv b/8b7178b25b/evaluation/rankeval/8b7178b25b_5.csv new file mode 100644 index 0000000000000000000000000000000000000000..bcbfc6c791da1cbf884428d27dc4572e7107158e --- /dev/null +++ b/8b7178b25b/evaluation/rankeval/8b7178b25b_5.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.327,0.014842213153411244,0 +anli_r2,acc,0.327,0.014842213153411245,0 +anli_r3,acc,0.32166666666666666,0.013490095282989521,0 +arc_challenge,acc,0.295221843003413,0.013329750293382318,0 +arc_challenge,acc_norm,0.32849829351535836,0.013724978465537378,0 +arc_easy,acc,0.6452020202020202,0.009817629113069696,0 +arc_easy,acc_norm,0.6388888888888888,0.00985601342581124,0 +boolq,acc,0.618960244648318,0.00849393752443934,1 +cb,acc,0.5178571428571429,0.06737697508644647,1 +cb,f1,0.32323232323232315,,1 +copa,acc,0.77,0.04229525846816505,0 +hellaswag,acc,0.45210117506472813,0.004966832553245033,0 +hellaswag,acc_norm,0.5958972316271659,0.004897146690596266,0 +piqa,acc,0.7399347116430903,0.010234893249061301,0 +piqa,acc_norm,0.7453754080522307,0.0101644322370605,0 +rte,acc,0.48736462093862815,0.030086851767188564,0 +sciq,acc,0.922,0.008484573530118585,0 +sciq,acc_norm,0.924,0.008384169266796387,0 +storycloze_2016,acc,0.6974879743452699,0.010622307774396942,0 +winogrande,acc,0.5714285714285714,0.013908353814606696,0 diff --git a/8b7178b25b/evaluation/rankeval/8b7178b25b_5.json b/8b7178b25b/evaluation/rankeval/8b7178b25b_5.json new file mode 100644 index 0000000000000000000000000000000000000000..1c4f0b8a2e7d5872f3e90de1e36d9338533a0758 --- /dev/null +++ b/8b7178b25b/evaluation/rankeval/8b7178b25b_5.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.327, + "acc_stderr": 0.014842213153411244 + }, + "anli_r2": { + "acc": 0.327, + "acc_stderr": 0.014842213153411245 + }, + "anli_r3": { + "acc": 0.32166666666666666, + "acc_stderr": 0.013490095282989521 + }, + "cb": { + "acc": 0.5178571428571429, + "acc_stderr": 0.06737697508644647, + "f1": 0.32323232323232315 + }, + "copa": { + "acc": 0.77, + "acc_stderr": 0.04229525846816505 + }, + "hellaswag": { + "acc": 0.45210117506472813, + "acc_stderr": 0.004966832553245033, + "acc_norm": 0.5958972316271659, + "acc_norm_stderr": 0.004897146690596266 + }, + "rte": { + "acc": 0.48736462093862815, + "acc_stderr": 0.030086851767188564 + }, + "winogrande": { + "acc": 0.5714285714285714, + "acc_stderr": 0.013908353814606696 + }, + "storycloze_2016": { + "acc": 0.6974879743452699, + "acc_stderr": 0.010622307774396942 + }, + "boolq": { + "acc": 0.618960244648318, + "acc_stderr": 0.00849393752443934 + }, + "arc_easy": { + "acc": 0.6452020202020202, + "acc_stderr": 0.009817629113069696, + "acc_norm": 0.6388888888888888, + "acc_norm_stderr": 0.00985601342581124 + }, + "arc_challenge": { + "acc": 0.295221843003413, + "acc_stderr": 0.013329750293382318, + "acc_norm": 0.32849829351535836, + "acc_norm_stderr": 0.013724978465537378 + }, + "sciq": { + "acc": 0.922, + "acc_stderr": 0.008484573530118585, + "acc_norm": 0.924, + "acc_norm_stderr": 0.008384169266796387 + }, + "piqa": { + "acc": 0.7399347116430903, + "acc_stderr": 0.010234893249061301, + "acc_norm": 0.7453754080522307, + "acc_norm_stderr": 0.0101644322370605 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b54274993d3978fabb16c43d13316610d9ae84e --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36770a9c49d0a3a60c79eb82a78c70d4f942375db450f6bee1200697e875a032 +size 208731415 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0dcf37d9a075a8457a3549ec6bca1e6b9a7483fc --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33712a8ff325e2fc2044da6dabb0b419cc4ea59d4bd3e8f8a38cee20f3b3e96d +size 208731415 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_0_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_0_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e1d1807539aba3e3391f9fa3a4041d637ad12c09 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_0_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b89c60bdd78bf10743b3493dc711f4b49a4700817d7df211ea8b8757577bdfdf +size 208732183 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_0_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_0_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d0c92125d991072c09a4947f502b712b82db2620 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_0_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9642950064fd9579957f1e01fdfc795da6d061e71c0fc725e896f74e764598ba +size 208732183 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a3e22a41d2aa0c0989a209db61c0cb81dd5818c --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:024165be02a40504a57d67449adfe5b95b52ecc6979f1d79b02d1fd96bbeeb89 +size 208731437 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..95c63fc027b8f0c9dccc42db615f7967e2b66df1 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b01fdb8c23c6dd095f21bbd82160ea8b1f0d0861306096ba75d424e4899fe2d +size 208731437 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_100_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_100_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef428d5fbcb99d79e9aeaa544ef6f499149e480f --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_100_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:577474908785b58dbd496d8dc8b7ffc34a5a01f093ba9f945e9aebc60f2f1fd1 +size 208732269 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_100_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_100_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..04b677d31e895d3b27ca3e498dae83d7bc32aaf6 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_100_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f13df8414f244b1bd00783e318424cc28da32d327c5bbea0db222418a7a74e5 +size 208732269 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f98b6e21fb17545f7d562215e2f496e6674f980f --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:276e15e00758dee039b026d5a9e975f273986ed122552bc78ba3e71b67787ff4 +size 208731437 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c43662525cc8c9eaa383f47e131114196f60309 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20a00027cd3a2740437f39e6841365550c2b9a1efc78b00dc1feff2952a8889e +size 208731437 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_101_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_101_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..673570dc7c953b20e0eb84814f7fdc4c393764a3 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_101_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:129fb57f2cb90eba983a571527636139bd321a0eb66c08b56b82f3070a390dac +size 208732077 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_101_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_101_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d5e1956043a09a491c1e564b2b94e965e7862dff --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_101_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:718bf8b8a00d19f71399bce2ed0fed4360e4fe5239966bb76502e9df3832c65c +size 208732077 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..24ec83f3da35d1010f4829a3fba3adcc9e56f016 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6ef1c6f4c53131193482f8760b1a781143fc44cfad8c111d2990801b360c140 +size 208731437 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e63f2d569595de82b1d4e2732e4e84b51044f889 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d14159bc9005b5364968b1af39eeffa0cd0aaf65d27c557081421258608de3bd +size 208731437 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_102_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_102_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7bb024be7dea866c6f0e3281488b3d59a6b631d2 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_102_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:380d0b75cb1d71af97f2cb4e87283826a2f9dc5788c3630e21f4a569a4a89b8d +size 208732205 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_102_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_102_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a0bc6d253388e6ba5d9725f34274f2809c36fe1f --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_102_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27d125befc93965c2a6c6544bd39949c243044cfadddc2f5466d04d9694f71ab +size 208732205 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..20bedd88745355ab7836606065d1c70291077d3e --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:746562490fbfc2e014ac14a79e8fcacdfde7563cbd6546785ad1b49edee08b28 +size 208731373 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..36e7cd5255c632542bd52899370e43b343429e93 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b2f99da59ee9ad2c05ce55eb5a27610c9d625b0c35107f39c28162cc924ba11 +size 208731373 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_103_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_103_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7002b2034fa9629865e14d5a9e0fa089676e5933 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_103_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dfcb8550c417e9857ae659c838292fffdb82b65d0deb805c4c973bc6cc33e1ce +size 208732205 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_103_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_103_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a2a9b21e0f8d5b8570a1abc7ac642672c3a5ecc --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_103_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8b9990f7695703dfc8f750661e453937386feb247d57ab36e0f60226199c2d8 +size 208732205 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c736dc4844c27ccfe58d179ca1dae322f9e1d165 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0cd75df19fb6d31ce3f91a1e4059a882c0577e40be6048c8b5df9594f50c0b35 +size 208731501 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..28176433a50b2a929a360b989fa48dafb18de2eb --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c22d8301573cb13c7c5df4266771300dcddb6d6aafa3c1b60806b3371ff80a7 +size 208731501 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_104_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_104_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e250938848cb24f3ff5a9b001023738800a11595 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_104_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e30e698a602faddec17b6a09692cff53ce2d8d3a1bed19703308943c2a0b88d +size 208732205 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_104_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_104_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..111c4b596bf5907fe4be0c7edf35d946037c2284 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_104_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c3a7126e221c0683d2ba705a0b404012a6ada3d2c1a7c20eb7cf3556563ee11 +size 208732205 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..59b37b4e758533ac2727c688393175f381699005 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:045938264ebe524449bc7bc6bacef2d774886a674131e4272b1aea99c2eb1ad1 +size 208731437 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c68295944124839b81a96cac47620c9d1cf27aee --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0cfb82b7ac7b2ddde1f7577f460775ba4b783714941fd0a07a2fcf63e979f533 +size 208731437 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_105_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_105_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..467bdac951630cc8e241a5f3fa896d5561f04f13 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_105_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f204a6678be5285537ebaecf07d9299b12d3e5e8a53e9a0b3d56d58d07cd347 +size 208732205 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_105_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_105_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8fe75c79c147752612df08ef1e36074745bb26af --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_105_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b15bf35d896c56d567809cabcecf69d45f657131c31bef367599a7b93738675a +size 208732205 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e29d8d903b71dcb637f7f019e1d829bba7bcdc58 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05c96312eed3f25f59509694562c0eb7ba524bfe9c7fde3ef0c88bd1011d84be +size 208731437 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..508578d77ba7a67543cb7d03e3d446339c04e543 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92e1956b053802766fcc6c4059bcd90d3d0ddc9a7e7625d3f3233ede020f4276 +size 208731437 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_106_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_106_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..20c8f11da6be6113b1f603597513318cd8f61b54 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_106_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67801a901b50e35bee2456f188d7017d3318510c67c5c98edbd1ecea1cff6b6d +size 208732269 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_106_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_106_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..272b7f6540b6bde31dd894df0d3d066d38ab7e0e --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_106_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a638d387239f071f54b2d338d17d0789079e52a28183ea4235cae6330dffc88e +size 208732269 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b2faa6af1c771f539532f4e21ae8b6cb7a12c353 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b08aa26e9e8858de96ba69116155ab84249d0408f07b0bc8586a4c0760453870 +size 208731501 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d32ed7ecb3f0d2a1755cfaa3bdcf76465321864b --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3682b9d8b73ff01b37e67153ca1835c034c1a23c75a80f0bcd82e0dcd149389 +size 208731501 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_107_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_107_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0dcff7db9d697ff3c24db090a3274fc275e02c4f --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_107_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:263978310930aad5099d7a780e00f76bd8c6c407c4183e1abe3bdfc7ba03dd15 +size 208732205 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_107_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_107_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f8a6a8210a7807f6437afca87ac43dd99f38ae06 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_107_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91d1ab9f3789ac23b2ca424c43ddc32d5d942a6abda7ac4df5db80801c8655fc +size 208732205 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b0b068625d0f0d5df4b551e7ac738563268ff445 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a39eb5886ec49590955403870af121384251020972ab6bc9bfd31365f655becd +size 208731373 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7147f7ff20669a8e85497ec0c391565c269fb851 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84a6064ca05874d7d49ede24270739a6684d088836d8007b1ad79bb2dcbb50d2 +size 208731373 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_108_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_108_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bb8947e65223aaed745b0782ef995d042d53b244 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_108_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5691d01cb1b3245dd62427246214b71bdd9f7fef35d547121309f7955460489 +size 208732141 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_108_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_108_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e6eb749b9a93534dfd975191c014daa1f119259 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_108_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cca0d6a7ce7e8b304e8bae335d405fd600ad733dd651d390ceb8e0572b630464 +size 208732141 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f958f8b6c39c878318288adfb40a877a0657ff30 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd68f29e254d7e24ee1bab1d006445c220f30fc39361bdcba69ec9e13e50de2d +size 208731373 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..40d94144d4fe3821e6003c49d3aa8d922cb8fe6e --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9493fdf808fb76f358e7a6cb6435c99d55aa4127c22f2fc43bc669da67c03018 +size 208731373 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_109_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_109_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..52669d602ceb2556eb34f878fd51320609e18497 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_109_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7200d74c490ef2d97708b53fcf8b2fee1f4579c47b5487e2678085c399584e0 +size 208732141 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_109_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_109_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4743c67cd9ab7bca3bb6531fe3e20b77afd69603 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_109_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1517735afe2a57ed12ebd2de027fe105b5a9339b79ded0139b3ee756721590b5 +size 208732141 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a86806ff876aa8e6ef200c5c9316d0dd46d4c37 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a95713aae5d105960ac6fa15f561a1be8f23441478a53b5b9eb8e30ac699cd5a +size 208731362 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d40f9f383b136ac9fc8987adb7bbc0f538e0706 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e83934204683f024106835eaf0d97854991bae553c15162448f70e175678e11e +size 208731362 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_10_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_10_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f110f0cb46e25558f0501d5a55fe68706b3767f --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_10_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5fa6ec216934551725bb19537204d5bf2466d877c8d014e4a71fb5c81d97eb00 +size 208732130 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_10_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_10_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c1adc459b59409a14d721844945caf838ddf562 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_10_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4211ec3e6de76e9ccb7e6fbdab790aa7738bbced7d58ec403dc424bd85d1e132 +size 208732130 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..33749e85359b517708d2dfa42670d38a1f5f561d --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4cd44a2acafb9e3faa933e6f8514287f1b86f914b3553fdaf56fcfe5f8efd853 +size 208731437 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..621e61385de00aa4bb19165f1eec9d08c909851e --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e77c80218ca44a9881d04f6c25e8431e3921b30b719f43070518fbc36309c44 +size 208731437 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_110_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_110_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec9e16f85573aefbf61dbd068cf6280d5ca1a714 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_110_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34e1be80e51a82abee898e0793420ea25a404ef634dbff2e147b56aaddb46398 +size 208732205 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_110_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_110_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..540f7abecbcefd7ce4c5f3f5c8579c00b70c6e70 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_110_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50b53b55952f9d2bb0bd691958841a6ca5f5a93dca63d20e7ac595582d60509e +size 208732205 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e370a8c518e81123561039efc1da5a7a55f2d3db --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85c20fb1dd3abc7e60167ae805c9da01fbd001252d38a88828d439b2fbf4cad0 +size 208731373 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e258b13dd1bd7c47ac8401f3aa3a25869d6574fa --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b98c83b16c076ad6f72b9df986c0ab0c412bd5c6a5d426f7009948e94fa38b99 +size 208731373 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_111_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_111_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5dfb710b6e77ab6e2545a8efbf490ac35dd4dc71 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_111_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1cc96432475e46a920fc626f59fa3a5e245957575c3698a7dc34f23dc93cdae8 +size 208732141 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_111_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_111_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea34160bb0ee4c3f73c24e307d042e5b4b4422d6 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_111_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fae5af1f95c18510d872e5549b1753badfba9a0b55ad2577f17070d0d4f090b7 +size 208732141 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..acfa308120487d5da7591b3d9495a3989a9d552e --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4afefc78af864f2cb8ac47bc40b5a5d637f7c77337ab6976efd0e9e323d0330f +size 208731437 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f1355a7dbf77782cb6bc55cbea32bc5972ec31e --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b74f5beebc4904b2b5ebcef3ba3cf5a303b2061ad30d18b59a29acd57b9c6e48 +size 208731437 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_112_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_112_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7131a4fe4b81b3ae30bf220e9a43d27833213184 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_112_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba1da7db8fcbf9441fdeb01cb85dd2887956939f8d65a2a7ee87092bd39f2b59 +size 208732269 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_112_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_112_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5745eb3d3ba75f1286ee586549308f8c56c64514 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_112_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa568e9b1f5302bd4632d83613f7adecc05c47b24ca2d4760a064bee7b1429fb +size 208732269 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb0f5c12ebacea5b2030614e4492d5542fec04c0 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73333fc914cd00bedc1fa2d493ad5bbdb5b8043228fec9a0914b7b9b3069f2a7 +size 208731501 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0536317d61661b00f99bdfdbfc6d3999a86911e --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13b60006fa096d1f48427661517832f2c821d2469b0f0b94d94f0775d84bf4e3 +size 208731501 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_113_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_113_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..318f57cce5bb6bbd18197f53901f3174cc65e7c8 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_113_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a081504cabd427a4df61437b469bd390bea5c04924010dfe6b22dea28d3d230d +size 208732141 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_113_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_113_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a1e200ef3a380417d82b4c2db966842745d2221 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_113_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64e5cf05282867bfe03b7de6d7ef78d2fb05fa4f2023121cb37b923e44f0b0e8 +size 208732141 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..40e1903c70b49c13c79fc8f19b1bea3a6720d412 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f02d74d11041f5ac759621d6edd3e3110c95b9017ead19c03d8ce13123efefe +size 208731309 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a75887cab60e4485ecea7b585073f6df8af36beb --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3357212988d739ba82daf185b7763eacba4594236e9e9c79d461fa3d9367479e +size 208731309 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_114_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_114_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf5b0d261af161f5da299750735a40e86e7d5efa --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_114_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23a133292a77a4be142c6bf8bd6352783b756b109a83a493ec4c6f2a6311c178 +size 208732141 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_114_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_114_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..de9246122827de621951726f7e06f7080cee2389 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_114_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3161842566374ca990d2b451fd5032e4f08addc9932b3dbc4d85078afd61c7a +size 208732141 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..73079ff5cc3c274358efc91966e97156dd998684 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6310c09c126c3a241a83bd545379d2ed912cc9af5d37608b25964e6b715b796 +size 208731437 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9197d70ba6159870ef3a28a26707ff4cf045d1a8 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ec5b0584c17268a11d9dfa232bed922c309a3e29a2f8ce81d75fdea27ed625b +size 208731437 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_115_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_115_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ed059ad9938bf3204b1cb953cd40f941ef8b5f7 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_115_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc1b319dfaf22ef3585c60a306ac795917dbfe54f1c266c1d3f8c87114c853ed +size 208732205 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_115_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_115_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e8a1df7fe07413fc16168c69d81dd5c89897fd90 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_115_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ffcf8c89e204da0560f61f9779c0dc3ebfd888ffecfb7896b54f9772b85292dd +size 208732205 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..785c56636443a7cadc27d5c732e0f6d0a8ebd952 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70aa878e4fa2cbe2a49cd57d06a91fdc412dacefda17468752740d8e47d5d6c2 +size 208731501 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1921efd94862c58752d05b8fbe48ca5f818ee7a7 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1700c15a4161a8037927db92d905096d534a2bb177c8967d254e9b07d81bf66 +size 208731501 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_116_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_116_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..746bc0ba6516ba817bd13ec594520d074c463633 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_116_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92700692e204db1e17ce0ee76f3c8228e9930c9c10682d1e1b02c2a6eced4590 +size 208732269 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_116_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_116_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..262b0c3ae640bf6a523e8f9efa4753d182147326 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_116_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d06a6da45d32cb7731f4d6307d3f78a9f10dfc3964fc752a7d80413b8edf72f +size 208732269 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d4de18da8ada2ee51af1452856ef9e4fd87fcc4 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24602f6816ce8c43236928ca1a1faa613dad9a4a99291b39578447032913eab5 +size 208731437 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..91eca342ba2e8bf8f225167e48c6136a4b3915e4 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6931421b562e153d5672bb828f2e2eb3c62525c1af45a64b7bc964e0f3f5f590 +size 208731437 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_117_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_117_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..048d1ae47722c6ce0d9e2f54a62ccd7857ded0dd --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_117_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b91ebfec2cd281f589f867410afc095adbac4f5df9d3eb2b101e6b5d367ff40 +size 208732205 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_117_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_117_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f77771cdea2a095e6272310894be34aafabbae82 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_117_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:742e1799fa53bc7dc911f518fd6780552db39c6d39d94d0d3f6cc2aa32453950 +size 208732205 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1fdd4180318e0383067ea7d503cfe83ad5f34cf4 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:606b5d51514dd329db027351f82de39de5c5257331874446c5f1f107c90fa220 +size 208731437 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..654718097d802ff0ae86aee990e7eb8f5147007d --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1ad3cd97cdbfb43a3790bed97870db39d34e7efc7f492db464fe9692db99b24 +size 208731437 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_118_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_118_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..979757c711cbe7d58127ed9da6fdf0df99141bb2 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_118_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b14c63ab8e626595874639c291febbaae7eac0929501a7e35f7f4f5b60c8aa4c +size 208732205 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_118_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_118_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c93d0f8f10c8068936046e1a9f5283a656eb614 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_118_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8fdf6b1d7339bea01a1129c4797bf6a295b6df8e800ecd71914a0314d14dfad0 +size 208732205 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..22a71aeed7e0561fc472929afeb14526fc806c3f --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2afa0ca1821f7f440ce264e99bd3294e4f4fca00f6e6c69588b463c55a706c1d +size 208731501 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..26d6bad8b8c983fb0d2d71d9c56215f5dca3135e --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2548d5574c93c438a5ecda670974c577d773a3800c61b79080b09c22a3afcaaf +size 208731501 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_119_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_119_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..af273fd90301ba927b926a1e26fa3bd031a4c273 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_119_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b264bf0b48c49386a51819c7e15133ade3aad61b1c901029f7dde907acd5105b +size 208732141 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_119_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_119_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b7615cd63eb4ba7584114a2a21b13a50514808ee --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_119_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b621d6130fe3a4c2f5ff63d4c2ed186508796dceb689db77eda4a33df4216ef7 +size 208732141 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c22e6649aca7705075c2975bb072a3e7afa3ceb --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6088719ca66e8e79f8eaa4bd015a70fc238480be9bb3e6db1b9c3eeb696de5d5 +size 208731490 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2515ca4c8938b08e003ffd1f3610d8bb42b8c71c --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20aa71b7b78f1aa31848845e06f6e4ebc32d517c9a9d2ae35e0d7e88d30788c9 +size 208731490 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_11_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_11_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..09d700e330145afb0a0e0d0b4e31670a2bdd05b5 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_11_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c910f332b64cd5accd336ffec385926061f4f036e84234a8f1cdbbbbdbe4afdd +size 208732258 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_11_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_11_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..07e3da0eb64d536ed09ebc5cccc5b07d3cbe08b4 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_11_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c08b9518e7021f8b4248b2291705faf0cb74fd01be5d876c8c95f3de8c6ce82 +size 208732258 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1db70ccdeefd74ba2f00006e84f0faf0daa14625 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbbcc4fc86cd11dd686de606642cc5f98aa5999864c4738089474548c65f85c6 +size 208731373 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..85ae6ddb03baded6a95af353a56d941e23287787 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:249e96cc12cde36fa7a395b60369c36d6654304f17a68ccd04468378a93dcd60 +size 208731373 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_120_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_120_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..99df60b54495c9801748e4e9fe18d0e269f69a9a --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_120_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a8f384167052d00d9db998fb741b38eec30e0222de4011b76e304ded3d9ae6a +size 208732205 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_120_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_120_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..23297b215d88730a81428b65355c35d41aff8d1c --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_120_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:176474c446e3dc65a3401c54eefb644fd9b06caf9e8f87eb98c65af3d029998d +size 208732205 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..292a0e7a293dc2f312058b3be80b6da7c6921d1c --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3aa37e8b89bf8654e7379b12d133fe3b12b2327021676e575a83bd8dd3bebb90 +size 208731437 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3faf4041f7bbca10b497cab11957fe7c9ff98952 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42c7b6f9108047ed1f2adf87bca300052104fa2631f4517707cb03e173a2f887 +size 208731437 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_121_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_121_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a117023b9bd9127f59125b94f5fc43ed435ef96 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_121_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51d6fede34f1bc33ff1f213752ea92e397f32d6295d6212a2f0caedc6990fe98 +size 208732205 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_121_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_121_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e2e9d5778e2852c5ad53597bfd4841a2806b3f79 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_121_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e889901083e49a46030d506761f591803c80fe132f7227a6b85b77d7f5cbe03 +size 208732205 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..921f0058608a0f0052ec3995d788259d94eb8dce --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:452e9d10c4f7e8deda288b7931cc52d80eb0b1aacbc5bd474702178587f444f2 +size 208731309 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eec6305f909e2928f740ddc2df83646b3fa9c667 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b31912a5444be71d6b4611808dd901ecd30158ec3eab736d76009547e050910 +size 208731309 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_122_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_122_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..458ddb5f33c544ef0f8d9bcb43db154fb22e6283 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_122_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b027e510279aa6873ad0db61f66aaa69b1ac2769611cfa03c973b677c3d97b6a +size 208732141 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_122_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_122_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7aa72754e76259cfbe3d55b9bfc72366fede956b --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_122_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:444ad159b8ea85741f646b1a6088ca481efff39d5a26e744e4bce1e2506af2ff +size 208732141 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0eb46008bb023a0e85e8bc70a4a4be5ec01a003e --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d44ca2bcab3e4aa53fd92bcad815941900e92ec387ef2183696b9e62e99a3c7b +size 208731373 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..18e72b8a9a51558169ad72318a1d6d7fd3e2ccbb --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d936c205935d45feb8c925b03436b1186bb680bab0a0fb44ef6dce5dbd2803b +size 208731373 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_123_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_123_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..feb1352a2c63d696ca8d16437d93c8ac072b5a44 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_123_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f68163bf9a18f26c57759e49ff5509e4d236317e9ae959ce0a16a5632e4e6fdc +size 208732141 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_123_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_123_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3da5bfcf425108d577a8457d5df053d60abaa21e --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_123_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d57bf347471d9d884f93544e84f0152f662ff8c32baa1dd0d17dcbbd6e34f2ec +size 208732141 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..89c4b5ca95ec1d577cb3c21f0d3774f41390d930 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3c4c7853592e0c4a10e53f0151a9cbaab524e089b0b1b8f181555c4d5c0f847 +size 208731501 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e1aeace1142dc6a3bfc0ed695236a4a6cd432e4 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29bb7372c98dca9298ee905b2f342a206d48015430af23abbd00460371b086c0 +size 208731501 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_124_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_124_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f924bc5020f66f96a4ec2ca59146ab6a82b7ba1d --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_124_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9d3b6b0f4989cabb6add8ab3ffcf208e723bd02722b8bd9b033aa0a122d4e68 +size 208732269 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_124_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_124_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..efac4b89791e38ef7b2a5d2ecafa24a96049e727 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_124_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4bc8b73510d7354520d4a10e02e598e2ed29a700b8c5832e74bf0368c3cd0f78 +size 208732269 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ccc948056aae36f69e9516b2d7790faf2ae73f48 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9796679c57fa3b695c6950685a2b0ab6c541414b888e570a8bc261a68d70d24b +size 208731437 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bdbc88ccf87580abd877136cbbb868c8616c0c07 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:144c120a959c5125022634824b3d9cafebb280a0d88a002dcbc88f7b47154c14 +size 208731437 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_125_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_125_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f4327db80f638125bfab250c237fb496b9fa88d2 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_125_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36a1012e31d15978a8b1ad65dd35d6af8fcf0a295c602f779b986561a7810a5c +size 208732141 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_125_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_125_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..db002b1dc0203f6302016887a167b1477f278722 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_125_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:895034a0a4ffdfef77ab70f7d62ec4584e6b7ba81d1605a226151058a5554738 +size 208732141 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bb59cd8743258b9a6131c22eaed497505a33fc8a --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a67b29fb63e963ce36c75bbbb445e07a3a83e3e66222fc0c80bc3ccada91a8d4 +size 208731373 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3af1dadb07f6206846d31218fc7d2a17d79fe503 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22f1cd2fcb26796e9eeeb5b4eb41bd659c792052be3949ad72200445512b4d2b +size 208731373 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_126_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_126_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea4ff672029064f8608aa0bb96d789976b28b102 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_126_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:554f096b82957ce489072292202ee675da5b0440d9b46fdf541b3bcbd7e4dfa3 +size 208732141 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_126_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_126_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f44f675db4b07a02c2fad54f1e1d57e87ad67a1f --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_126_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40eba667ebd5c257b8d95e25823715f78d16c71b8b9c3529e3e32671329bf23a +size 208732141 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..030d8dc06c5de0b155543b15d2d7da5ae3869ba3 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5725784dcd1f5b20e5911b9a1ccbe1134de90fa8d8aa4726f0ff61688de810c +size 208731373 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..27c1da558984591fc64d32ecf5d0b9b641df0ced --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:897dbeded3391668d8fdcef21958d4ab30f6600f0d86cdd7b40a818be1d42943 +size 208731373 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_127_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_127_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..46ec382899072393c22787548fb2efd754afc3ff --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_127_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:572d3253a1f508b933e820eb51419b95ab27663b8722de5e2e8b92fe51370af9 +size 208732077 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_127_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_127_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fece71167c770ad2a80e4ed270610a712a7064f7 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_127_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:917edd21b5547b5c2d1f3ff45e4c9223adc255ce41d7534e8260758540e68118 +size 208732077 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3972d5f68e89421bd5c09a23aa47ef0c71f8a873 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1293b621c618d2ffb1cac96048016e1478cf6d721f28eea73ac31528538e4fa3 +size 208731554 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..846ba7efd57e965aaf3d20b71cb46cd698d095e9 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b44a8da30d244902699925dad56cf7bf656c360e4ef7592ba30ba0723a40126 +size 208731554 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_12_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_12_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a045789eddbe3a13387c585a18cc80b8a540c64 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_12_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b24cd9fa01e508fecb676e34f7726f4d15ec69c5fa374d694d904ba55818c11 +size 208732322 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_12_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_12_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa11dda2961e67474f294746c5c7851cdf0f3b89 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_12_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b9a37963de85a50f795c7221a284571e9d9f1fa7ac3a959970fa1d93486aa0a +size 208732322 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..181a3640e162ee69ca69d35b5441c4a8f598737f --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e82e911c3a0e9892e0b46d35e86c4984ff227e7e451c28ef67784caae0cb1e47 +size 208731362 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..23bc447de4ce03f243f63b910c55cc4152c389cc --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68f803e41ec8dfc9971513072d2460390641a80987f8506cbf400eff7146a36c +size 208731362 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_13_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_13_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b9870438c7e5fd83f81328f4222bc60b23b2709 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_13_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e8009774400ac578e908371b896b485379dfeda496bebbc3e8004ae5f82f1cf +size 208732130 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_13_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_13_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ef48c05c2109edcf0e2c48de365fa78ca854280 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_13_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36d76c47943da55bd5518b01073bbdc3a9042b9dea4493a6e96dd8d3b767fd0d +size 208732130 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c19ccc9f70748f2138b6f3c41efbbb0a50d48c9e --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60c20edcf42095e15c008b9fa4217dc88ec0e13f6e33b655e4911c4de0bcb9c3 +size 208731362 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb6088c3db7ff70b69cb804401c65f7038d7495f --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f9453711b63c2ae8acf2391e5c3b456b4b43d1395682c9c6e0d226b039a2fe5 +size 208731362 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_14_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_14_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c040d22b7e81f86495a5ba413381b70933c81f07 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_14_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7f64ce60286ef1c8d6b7f1d67c97f085ee9b8ee2b5c1c07f4af631bbfad7c8f +size 208732194 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_14_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_14_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..df19a9a332c106d5b857b37c241a8e4cb2282b4d --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_14_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b90f65d9caa12f1d559299272f68b89db46973eda038aa380e57ac369eaed99 +size 208732194 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb05d4dc4bd052a5bc7a2446f72c8356d46160ca --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0344726b5e3a4d93cac225603d41c5c2c80a56651866bc515813f0586f6f2a72 +size 208731490 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..edc967296bb855dbb14c54a52b016e61cfc2ceaa --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e73e58d9403ecce758f39331186c2cabcafeda7b64b1a9b1076b7722e5ac0f25 +size 208731490 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_15_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_15_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..76956045178a9a7eb17df71febe1711324f6d162 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_15_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7010bdd9aa7597118bc2b7f51b5c72793f19304ba464183eccd37dc280d1a9f +size 208732194 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_15_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_15_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..54a7a9afdb1ab2cc20efba83f5fbf85f08c40621 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_15_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5776e72f3b321126c32882455115a462e1de97312702d074dff801c3b3084fe +size 208732194 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b532b5bdea81e4d1b3fddc66ed14f6f3e2a2cb18 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c74d33003373e5c557d29817329c57fbab12890f29a680b54cdacb3d0733d292 +size 208731426 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb5cbb546d52f339daf15c6d15b8868ea4646219 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d898d39b66231dafab2c61201d938274445ca74d4589f342ca7033a0c671f0e6 +size 208731426 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_16_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_16_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bdbb1740ccd9630bafaba0bb430b9cc81ea2797b --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_16_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24489f1105fb1bc212ab5df9980cdf80359e087de518cc6f36178544a3e624ab +size 208732258 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_16_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_16_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3e660071dadf2f4a5771cc227007f0a1594e2b6 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_16_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f00abb1fb1a321f13804777ed6af659112dede0f389587d61705205815d2fe6 +size 208732258 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb05c948bdc48a3df5764f4d29fb7160a4a92f08 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32947bd8213b6e364e13166865884a4b1761b3ae5094d6730afd9fb4ea7f4249 +size 208731298 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba3064662aea0018083a3b1aeeee4842cd72f02f --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2b6e0050f0f8ab7ec2bf0a7f4a68c7987f05d6b7131b247c088f5c08969d98b +size 208731298 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_17_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_17_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bda2c76eebb18b2fc8966b75e73c4c609b8d985d --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_17_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e07e3bd27f5cd448372fc1be4c5f91a8b22f84f1bd1851b4e7471741563da5d +size 208732066 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_17_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_17_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..636f6c1ac7097470a41b97df55981ee868881e13 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_17_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e057032a12a12fe42b0077414ec08d7e9337f3ba549d0af11a1c2e020b9cad3 +size 208732066 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d80b0c4067e384d3d8dec064515a569116fdf92 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be29b5684d2e5b8293b858b7e86c9308b72aa32c677682d6217517dc2e56728f +size 208731362 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e16bb050dd033946e23433ce70ed0fc7738994b3 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6bcc06dd252173b578fe86414bc4711db70804d11c340acf3c07bbc9ab6bfbd +size 208731362 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_18_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_18_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..649e414372e5c43c5f1504429c83a26778f4df84 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_18_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:584f7b43e5f0b8377b6140312f6380291ac627c8a698f7717ba555349880dc98 +size 208732130 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_18_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_18_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1ee0ed02cbd57f0f90bd03055f8a39fb3c6325f --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_18_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e950efdeef4c9fbbae1d1f16db0bbc0f61ca023fa74ebdd2a41d9e9f9269c6d +size 208732130 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..98d38a42a744d4f6dd3b03e41d1efa36bb233d16 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d3cf13d874ede14d92265866d46cab4540837faf7c711ba168f3757ac1222d7 +size 208731362 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c752ede2705d2ae9d8e54e1ea82e94ce65ec582b --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4032bfb1a1282cf11e18bb28b3dddfa45c7f079e89adf49b4ea79ca075c1c5f8 +size 208731362 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_19_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_19_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..db67449d3e3c07ffdb73ddddd6a4be9d87898f8f --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_19_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:607c46d73561d37a3ce9a19d0f2855f7b65523aeefe6efc7493964532d72ff33 +size 208732130 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_19_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_19_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a11f6f8abbcd30a8170cb73ea4076769aefefbe --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_19_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf8405edd1f949fdb325cb9821806b40323c99b49f7cde9b7f5cfe257543fa69 +size 208732130 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..552dd5033993fdb4ce2941052a6968c8d8ed39f0 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f2cdd5d8839aab60493a4e7b4b860d1355ac13ad6a6861b6a78151d93677920 +size 208731351 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2b949bc2d6225ac0787976b0e7b08740368bb3a6 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3fbf699f3ee995a63845d9584c33fa614e7a7017fc351ee4d77b41d92d84b050 +size 208731351 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_1_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_1_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7dcb5bd008ed321c4a6eb9525fb74e96aa6d8c19 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_1_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87132edaebd5cc520ecde08042635b93dc5dbb5fd15c20a3dc30dd45f4f646fc +size 208732119 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_1_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_1_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0e64bd258c7ec67327677ce3219cb29ee84de6cc --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_1_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85e0e237caece35d9dc17b9ed2478cba4de06b53f27e895725210a39979eb0ce +size 208732119 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..40f0ebf632b6ca2a4449f39a3bc56999fcbadd6d --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c445b33547061eaecb0d8d8d30dfe3d815d49c311e177ca8958c6ee1a97a58b4 +size 208731490 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..71f867edb93d32c18884dda16381ec4c8c38b99f --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47f5a77266d5faccd199e975106ea0eef2971b9b2722f6ced2d61b98a6710c10 +size 208731490 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_20_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_20_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b8384c1afe5d650dfd86c77031dac1af6a96914 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_20_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fcb321fe5d453fd6f09326c7596d27d7dec9a7ecf050c87f1f396e9e5b3514bb +size 208732322 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_20_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_20_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..171d9e32169dffd973b86a9754a346d6b68186ac --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_20_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec02b30815eb5c6e344cd520fc70b0f40934c214a354664ca128414334a4c4d1 +size 208732322 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..876cf5b0d2a9ddcf072c943c57d5cfab16e65098 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8da3da234f6905b12914691570ad06553df88313f0dc3f8a9f6127ba9307a9b +size 208731426 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..240e2b51d357b6f4479757d82223a03b43505ebd --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11fec34371e3f94df1ef6a26e28f6a2017f6949a3ca5ee4dc182f62ea4a50c68 +size 208731426 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_21_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_21_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3d4e806bc82b2712413f78e02af05fe91cfff953 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_21_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:526221fcda7299fe9b7f32938fc4f12ac4921721e9f3df868e1be5ce158d7c80 +size 208732130 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_21_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_21_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..30dc9a01cc3989579c3325740203624a6e156271 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_21_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f99831b4d745ee9502f48433473dff4a5795b5ce5699581b52cef954c0bcdee1 +size 208732130 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..92059bb1d8fb87934ad4f4904a86eb2a21fbb3c8 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6aa5d9099489fdabeb70ad721b2b10bb8959abf6e254368ab5a8efbb32ec9678 +size 208731362 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ab46fb1796610ea0fdc2a7eee810e1b6db1e78d --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b035b30c762a932910b94792af01f766b9ab36ed996541886f20a777a43d5742 +size 208731362 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_22_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_22_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4333f818e560a4ed37c6107f98522257727404ca --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_22_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:970b52945c85c0262adbd5b314adee5c0ce9787b53eb0fdd1cf8c3a654c6a593 +size 208732130 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_22_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_22_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3960a402e075c321447cb0f433bb57a0c3d27a01 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_22_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d0c560dee798be81006fc676aa27d9443a9a63c07ca2393f805c91bec726a65 +size 208732130 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cfb7f3f3ad50d8aa86c4beb9ae20adc9767d86d5 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e8ea1ba58a2089812af5bb19038b3a6ca56cd9cda7035dff98b2ba963ead657 +size 208731490 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..68e5759c98a471212784694cfeb152151b542609 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:604af284dd77d271a2a8a0e6abcc824446f49291104db541910ba8c7f94ea3b8 +size 208731490 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_23_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_23_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..da25744686a9d916b849e052db668cc3558af0a4 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_23_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df774062cd88e47bb6ab2064d09264dcc46390cea0b91121a03407de7638c807 +size 208732258 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_23_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_23_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..84c942cb4b81c2f47b744ae9b7bd6163b0342b6c --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_23_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72b9b582d7a8a3848fc0a40e48081b03b1524bc268969b0d581b2ace42f85448 +size 208732258 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bdb391437df360e8f4e03d59326cb140265f6d83 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a75c786aa1290e3ddc34f945504f632c49c70a3a326644f18fc98fc933d81868 +size 208731426 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..339f9990c35bc031a7c7ab208db962cd661cf6f7 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98b90c4510fd620c00c1d0f6199346f60cdcbbda000e32e6bdb9ab05e5837fe6 +size 208731426 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_24_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_24_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8bffdaa339db941ce0de9573c99bc2ad059d48e8 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_24_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3213be8ca08cf16725bfb88dda1d7a2087b41bd06fdb2260098cf1441a2c8302 +size 208732194 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_24_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_24_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca62107ce549f763194d6272f5405b3e441d76ea --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_24_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f09e334f69cccc5f3616980bb4dc31ce303c342120c1389ceb6ff6df5a93a9c +size 208732194 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e78bde42a75627d247e1f8d73482e9f7d7242468 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c623a8740a584056541f3f6d11e0292ab33c4152b13b452396ac5ccd75390f2d +size 208731426 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3bf35d41ada72a0858e12cbe48207093008506d5 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d9be4afbc69f84d5cfd34b8786c94458d708517c097494b09770ccd494bc52a +size 208731426 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_25_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_25_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3aa43a3b9e66fd11df89765dc2241b8fe568cc7 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_25_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6825d799f2f882d36e7f0be29114549d8d4a29cea7aea990cbfbc9e1d4c57800 +size 208732130 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_25_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_25_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..957141c68396da164a1dcab343629a6755868c94 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_25_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3602ec30f909ce8d592cd7af638efbcf4fb988afcda4eca798fa6b4a18d36623 +size 208732130 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f5567da827a952b2281c9674bf46e354d72866e5 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a16ba7711f036dcfe0d2ba97ef5af16b2322306222da6b4b6b3f3ba7daf4bfb2 +size 208731426 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..774a36de4e6ee9af2c7970152b8951f05bdde39c --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc45887f41c49815ec0fc0ae7065cdb94c0c41cf4d0c90fa9662b2295a0437de +size 208731426 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_26_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_26_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e88909550f82e5f07d674b7233f2aa095f9ad470 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_26_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69cfcbd952e1eec39b9dc57dc7d943b128e95c62b6fbe92b05398716fae2c7f0 +size 208732258 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_26_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_26_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..59b6cba94d2a929753d0373f6fbd22a5779931b9 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_26_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad485d392c3800b0fde26a090f4ed397fd27397153e708403c4946b8de560816 +size 208732258 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c3fc241c5bf7b58da1d97c8b5dc9dbc4303c9ce --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6a3a2c3ed32e40da6531f762efac5ecea3c71dfc45023c7b7a47433a5fc1347 +size 208731490 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e928f77d8f095a331694f4ac6c011aa16628dd12 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95187fb75fe1d6723c956430b4d7530beb1f5929a96c9f14678e39bad30207a5 +size 208731490 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_27_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_27_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..918654e12b3ba8a8a5c0a78d0ce569163e1a838d --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_27_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75f6973e0a1f89b75dea06704607c138a2e3fdab7a1799fb8d426a4f62cdc266 +size 208732194 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_27_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_27_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..38fbef392d6a275fb03eae2f71e34d1205fc2485 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_27_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7435bde6be2232ff33efa7705c0c689f72e228eaf7353b3a250190761681d773 +size 208732194 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3133c8e9d3fd26b9db9d9117fa2b753841a9fed7 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01c08415ade5ea3f3d22d05c203b2a1de713ef13c3de3e74b8d3eca17690d065 +size 208731362 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..298b42c4bc8a52f6d87e5706b903848acf06d702 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7de840bea7fcca40c851ab5c895d99f27bcb4885d376feb9ec80b3e8f807dff +size 208731362 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_28_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_28_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..68bbe9beedd123071c4b4fbf28c6d49439da8ac1 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_28_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21c783f3ebe948f9b0c03651fd4256ab1a4f96d19c637bbaf19d0b5302471c78 +size 208732194 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_28_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_28_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..04ff90d9aa6b7f568771bbd5da949a6ecd36adfb --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_28_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6653eaf4c6de2086e61c0132821220b68f46575dd599d55d48cb19f212b72d1 +size 208732194 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..43658e1d315115ef778425d09e04ef57c46e95b2 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a890d7869f87a130edb13ea12ffa21f0e0e7c5a67ba1ba28ad4548220d39e48f +size 208731298 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..066d880c83cde1b7390e7e66501c932d46ceb5d9 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6dc76e9c0e5a58fbb03edb661fd3c90a20afe7e9bc82103c6099601c0f487839 +size 208731298 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_29_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_29_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dccf937b2b9211b4001280f9b468f8b0fe23ce28 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_29_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f94cb5411de7b1c9571a0dbb282348d238d59c53ef9f18cbebb8a98112779a4d +size 208732066 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_29_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_29_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5dc492a766a5e55c27d1fedcfe35623b69e87f82 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_29_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:414c39fc2bfb4ebce24c641bc8acfa1b087703171fa9846e59355fb92a8097c4 +size 208732066 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..63e43e601f3e5b4ed413b358ca3c766f0c3a1008 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9af45e8161415c70887693ea3c55bc02b6048366c03adfdcd2cff30bc40d8244 +size 208731415 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab08b75979bb8552516e21b409076f6ea0247084 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bbb48cc5326b0579c3c17e7d975e1b03a257baabac6b034cce850f1c80a388b4 +size 208731415 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_2_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_2_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca87436b1d29c63cd6b7f32ae94bd29027418976 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_2_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f58b20f2680c2b7fa1dc6309525a0743162f6651c6719f55e7ee8ce8833d204 +size 208732183 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_2_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_2_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8274ddaf01f052606c1cc94c39ca386445038127 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_2_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7cfa0e65a92f405b673f98fc7bc48bef878b9ff6713fd0ee87939f8d7da0288c +size 208732183 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba0084e3e1b78bc6ffe6b50ad875a533a7dcdabc --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29dbfcf5dac7a40dfa42438a8fca0e32d217cb57731a7c018953716b8a23bf36 +size 208731298 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a5a82157f4cd6058d730b2963ca4288dc99b918 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e3d85c86a3ffa006049c45484ac7bf836c95700b354459c185f7dbc6d8ff3a5 +size 208731298 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_30_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_30_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..37931a1b61822007db541a2a22236ff9c9e139ef --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_30_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8913be5861acbbe8a7cff0300ada868443d5b98fc58e35b68e598050e5af77eb +size 208732130 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_30_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_30_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c680b72e9dff2b115fd6f62ee65d3cd31d935050 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_30_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a58ed5c764f5eb4fe94e8d7a0c3d6ef1271a86fd4e7711cd69ffa90df104669 +size 208732130 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c7ed04906803aae5be11f77519d8372b41490786 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a13b39032a7f39c54cbc10af476e56043e1e95c0c30bd0a064c383fb35c5ff9f +size 208731426 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2b093952c2775e0938ac44cff45b265d2fd95ed4 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc0aa8af336639b1020e57714653122c5856ab24727fb29bea0455ac7f4c47b6 +size 208731426 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_31_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_31_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..57e508a9f54bd4e99818b393a755915e6fc52462 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_31_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de1f75fd351028ce180d7154aac35cff75cd0168cd59f0f7c7bd2b28ec38d0a5 +size 208732194 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_31_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_31_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bb50488de9675b7ff8dde335bfd19dfdcef32aef --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_31_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51a3a82c040edc7b4a308df78f0d41267b5b4ce7186a0d7d1aee0b09dea5f287 +size 208732194 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..95b46794b91a6475787c84940519c67e8ec2d08b --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf42470523d095c0f6ea363af513f3962cdeb7da83cb062925bf2a741de56447 +size 208731426 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..529055ad71b44aef2c18336270258d8b26767d56 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d477c214d188a21bbf5876c3e5b161ba2912611692d87fe8ecc2a6b05d62f58 +size 208731426 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_32_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_32_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bdf71e2c58698ab34201e5192f4f772891b6059b --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_32_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8735a7b4544d3afd29b8e3a0d1bc5f7c1b7dde4b5268c95d8e0c3b5a50915d18 +size 208732194 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_32_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_32_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6fdcd28c27dcfb9be466b8229b986c17d7d3fa46 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_32_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96bd893e8a60ce3f1cfee4ddb83a51c4705d7793dfd9ecdfb2726dcbba3942e1 +size 208732194 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..217a348cefdc20979fdce773392e8193b75e4fec --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c63fc149c149590fcdce43d7322183159392f73e00b8fb4432afcbfd5deb7bd1 +size 208731362 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..37cf4c6581ce442cae6538f3ca14607d7f07d506 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0747f01aa797a8f6b514783b4e4d738148b549b0b31d300b9e6107f35d8cdbc4 +size 208731362 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_33_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_33_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e6c48320f96f339b19523f910ce99a9f8d3ea099 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_33_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58f4b31dfad6fb85c2b5ccc45bcf677e612927f76550115934944b52156449d2 +size 208732194 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_33_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_33_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a82864d188e18beead0ed5c6c0add34de2dcc97 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_33_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4416e46596249ffc4b3c593cfe0f6c23af592a114877cba1539f1d2f127bcd9d +size 208732194 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2aa20a049b1d0109e6d26612fc71340da81c89ab --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6c174c254e36c348631358626def6cbfa139812332a42ca83217b815f0bbab3 +size 208731426 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f4365cc9bf5d90917774793d5660d3b38cf22af2 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e706fdfad83a7e0ef1c5d45f77b2b87cb3aeefa86635cae0a16b809db3c135e +size 208731426 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_34_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_34_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ed5096682a4af5ac5a4cb8e1a656ab5a766aab5 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_34_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e74df5716f370aae110c9d1bca15abcd0789640b6791940dd6d89c5dc59bcbf +size 208732130 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_34_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_34_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e4960bb39f3f29e60529c9196d2d6199b4f82775 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_34_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6d7ce7bea4983e9ed88645b6a81e816bfaa0d286ebacb6eb24a5a22f0839865 +size 208732130 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..76628940dd070707de2b56990ef29f20151a2233 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20fe5b4d1b56014ab61c435d716dff9ff5210aaca2cc10447ff9c7426815764c +size 208731490 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..67b58054bfe345524d26e724c9aac04766cdee58 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68c9218589eb50e07fa04249c21bbc2a5e75d6d4e2ca023520178759bff1daa6 +size 208731490 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_35_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_35_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..69ce44179a8a70cce6d3c6873160a7b3fd98b77e --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_35_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1629bc92195be720e702c51fe14d4d267fa104432e75307998c59f975398f5ca +size 208732258 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_35_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_35_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b5b834e5a91e34455226bb369fdec85e7a7d1ee6 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_35_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb0842b96a280df07853efcaed07771a980128116b221018a6b9ea5ec760844d +size 208732258 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bc81c2c85ae3476b9cfa0a4fa6c7c85caed62b4e --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aa45e4110dd2559a3a9789ff621272842f3a2afcc748e7aafdb276a1301f7c1 +size 208731426 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b7b8055bfc01ebad304ec9d9441a42f0e3791805 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ab59beca9484a12802be0fd8f6f938199edc52fd1c785d875451fd397f7dc89 +size 208731426 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_36_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_36_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..63cb997f709e35f9b8f292d67d1cecf41bab5bca --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_36_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61384bc7032b48616552ce82ae877e2fb0cc42b38001278cac7f472f1d69ab23 +size 208732194 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_36_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_36_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a93edd639667c2bac1b6e7ad338eca2724acd33a --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_36_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2115933a44e9a5c1d2e24b7ab3542446ac589d075d4af69098924916439f8db8 +size 208732194 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1863604d3b9a16fa555af26c419e80beb2105f8f --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad0e38662541a746893f7d2351a9d032158d8771eeb7f1b5321a86e175445e40 +size 208731490 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d8e81fecb8516e5c48f604c1d43021a98f52d90 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fdf9212fb39fd116e588006f5b1cea883f418d64f7a67800b9ece522fd79e5c3 +size 208731490 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_37_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_37_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a0a539a2e829b8956988e7da5ee9fa5a701c9fde --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_37_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81d0ae69c8e040b520aa8b56510db8c3c9255bdb07601bd55f728a7a612fc00a +size 208732194 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_37_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_37_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea28928e761eeeecf0ca730f8c5173ca8efa7dfe --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_37_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:684c5b751efb8e960588515243678cb855ff1e35e3574d0577ba2c18163c48e5 +size 208732194 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8cdf2e95291f254be81b961c2e125c508a09f98e --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de8bf1e5de8a17ae88b1dafc880159dfa88f9d97f0243d10e239c489d192b17a +size 208731426 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2dcfa5576bff5ea9352473aa06c84bf461058d80 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de230d8d4186de41713feb5140a0aeb908ab24a3d2b58786f1568bb8fd653dbe +size 208731426 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_38_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_38_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e205b7a037f0a018ff3a9e8d43807ad2e982c77e --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_38_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6611113dd98de251969a97ea21aaef54a4170f1473a9047e70a948e2685e607 +size 208732194 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_38_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_38_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..034991597f7bd1e9c2a5b26aadc53fb309b66165 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_38_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6753f5cd7c46cb4d22c45e8a7f9755b8b3d872ed4dfac083fce437c178ab4595 +size 208732194 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb461801a4012468b0ff36d53abd827fc0dfa444 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8bfeb8796412332658857a4f84c919440c053231c1fb335e04f1e00133a50288 +size 208731362 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3fe2d01d5c1a46fa37ec2ff7dda8964be5bbca31 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:498d56604177c5101f97cc00179bdf0fcb1d2e33ec0d170e303751f1ea57d225 +size 208731362 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_39_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_39_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5da3fd242181f8fca1c41086e9ae08ea7e28efff --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_39_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:690f2396ba1c99080a8a7d2864eee377b8435dd44d484fb708eab63e8d285df9 +size 208732194 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_39_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_39_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..117ad52fd407525c84a937c9ad43de6879591987 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_39_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e98de4c9c0754e70047bbe0074d4d2097be80686534cd1b5ef2b6ace37a1575 +size 208732194 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..db57dd23af3d15a00aa683ac9cb446e66d5d4931 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1133d142d745ee756ed1144ad529dc45424c803f0b6f3ecff3b66664506d5c30 +size 208731351 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..46b1cf1bcf0caca154c2b8c96e4652bfc999515d --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a142594fb453ac93d79d593a71a4f9f89cbb9050a30f5bc89728bbf941628265 +size 208731351 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_3_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_3_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7dbd123986f6c668afce723b56f54ed1a5c10355 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_3_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c251c8d6a8139734a8b883060564b9c3117fb9eb314acf2295b029320b7fd1c +size 208732119 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_3_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_3_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..10988ad0e2943cb4dd3b1b1fc13933c49d5b7e32 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_3_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:713d3f158bbc7e73620ceee771c733df4b1cf186da7d18392c71976012a4d2c2 +size 208732119 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d9923cab0b47fcf7889c6936e5e8fafdff2fd2d --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea5835056aa41eb2d33577006e034fdaa905ddc9d9007094b0512e006a3f9f24 +size 208731426 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f2f52ea05c17172b54ca3289af6b0fed7a92f98 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7e898ca3501a59f6ae1a9c4a7564db576d4ad4d30e5a74c9d5b6cc7beb7666b +size 208731426 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_40_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_40_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc9df63527bfe0ca90fe329bf9b4d05877ca7619 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_40_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a1861b1b354a5017a61159e09403bb3ba24563386d1d77650462ca649235240 +size 208732194 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_40_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_40_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..67437cd0c381f77bdbcda025d21415c3400ff4a2 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_40_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1975b2dd14b8b66dca0c9df91b32e92eda9629d2dca2aeb599cf97f0962be2d +size 208732194 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c9dfd3035a19f6173d9b9c6dc4503e72a2606019 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ac5f84c29438a3fc1c966ba4b1871f0bf89d894e54d2ac39e8c156ced1a3131 +size 208731298 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..29b76822b74bdc1dcb731fb3f06a0f6861020f76 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb7feb65ff3821b477c47249037420a81fab94efee5f067c1659a02b55053500 +size 208731298 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_41_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_41_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..732206719705d382ec4a99cfc977dcb6423cd721 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_41_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ddb50a0bb8ddef1df2e10244aff5281b8d947257c0fcf91228f9c0138309c346 +size 208732066 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_41_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_41_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a4920eabde9dce441d5038864c23f18dca3f475 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_41_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:adf01ffffb8e781c4c926e6a4c1c762678f63038f7066038e08c40306a162a8e +size 208732066 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..08da624b19538bcd95eaede83a0295b12a452c0f --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9544f125f41027244aa429688d732124c38ae8a91e69862290d37ffe5f310472 +size 208731426 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d733346d0f7bb8ed630d2905d76c0ff29d086452 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24824a990efce18fbd5decdac027eba18417124d0e7ed3a662aadc0d9e4cb8fc +size 208731426 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_42_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_42_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..53742d517c40d8eff7062739661681382f8d79a7 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_42_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b1063fe79a94bd4074b67b3a4e5c422006c471b3961927f5c50f7a1672b8e84 +size 208732194 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_42_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_42_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d0380be1b2580c5877849956ee2a64af2848e5fe --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_42_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f6caa77993f375d72ffc30b574bd56a7f13f610ded3f3869fded16d52942c92 +size 208732194 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..47d5beb6429d931d79ed91b587fdba1f11d10aba --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2df552c26f0431a0810ed333b1ff3277dabf974d8561e2f4006319917808b578 +size 208731362 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee1ab3c6f1546fec082d464d70e11ceb9bfc2d2a --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db49b2fe65dd808c2ad52d45599048eb537eb8830a431f08680b84fb55ff454c +size 208731362 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_43_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_43_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f41154d2632396b00f4a23b2e790b7c9f321bec8 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_43_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27d91a075e3627e53bb43f82cc8ce8daf44a05a445357c7e4d18862b50e82db5 +size 208732130 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_43_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_43_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..87e4f254a513aa650a3e6617b8a1cb31a240dca2 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_43_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6500c7de27be012b2b42aec33ebd058ad5f2db46bbc6cfc33174ffdcd6ab1b9 +size 208732130 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c7cad6b9252cb316f63111881d6f1d7ea81173a9 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61a8f148135f3e87d35475f7c2bc157ba71dee55ef7baf5e30d2718b877225cb +size 208731426 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..15085b6b3aaddbcf164a84c3569c6a640f45fa72 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:953a8c7c292d92ddd08b6b591197b166edd3bc53fad9617ba7e410653e16e24e +size 208731426 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_44_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_44_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7c7530fa8d480440d06344a876043dc5e793b41 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_44_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9fdf96d4a2dc96c26d7668a0d52cfa9e8f894bb94013346a9973f3991e1d7264 +size 208732194 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_44_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_44_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..119a4eb9fce49d1d74688ccfabbca293b9681531 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_44_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6abbe21d02b27950227a17f23df496e52e8644b5fc959a091e7ae593d3179af6 +size 208732194 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b6a44e48eda9d32b2fcc7fcd7f13e81cf0f16e39 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:087fd8b1c65ed013ff18603d7e37704845a73f0990379af47fb2262ac50ab69d +size 208731362 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3cf331d642bfbb084a27f8801e18621e7303fb04 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5293c7b403a834c5886cb279df36bc91929e3e020b13b56ea7c9e04b59661269 +size 208731362 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_45_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_45_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..47ea7ed00766cc0397244148b8fe76a4358b8d91 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_45_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d94f3df67dc33dee9e07e90bc36f5b210a2d110cba2d3d9894d09aca9e99e55 +size 208732194 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_45_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_45_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c111ff1794aca031db8c3a6d0a80b3d75a36adf2 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_45_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1cdb72fb2cb9bdebc3dece20a14f02c91318ee0b3653e07be3a1ee06d52ece4 +size 208732194 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b297b3f9c78a4c1e213f14611af8a15bbf41f76 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d262e79d5e6b59acc7ee21d61a17a9b0425b035f60e072ef63a0f6311a81f839 +size 208731490 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..85c2ae265523ad39c192053461a12d1e3fa8b572 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b5eb1e847043c2cc091532b9027a1f9ec92535b26db4cf4e005d4975aa11c4e +size 208731490 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_46_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_46_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..14d792116566c67c065ab288c03b141a3171feae --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_46_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33ff3da23c323c53d74349f6e4a368f0e4717d37f6803ec41bd69c27881433f4 +size 208732194 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_46_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_46_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..db59410cca40a702ff9a3403ec413e690bc1f63a --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_46_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a883fe920eb9691151a706f95e3dadc16732d54d6e0b5ef6406d543d69de1a5d +size 208732194 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..58ad26141da2fa769c4e3f49cc178c2cae1997ba --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28f6943f020b3533ac2bef62a7eb3778aa6687631572e7eb9f8445daf95a85c3 +size 208731362 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..50b55f50118018cbefad4375167618ec92a33234 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed38d058b79dc873d1da65f8fad83aa29797718229aa80731ab69a2ec3fd6117 +size 208731362 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_47_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_47_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c008d29efef23c449754830bd8c6ab77a917b9de --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_47_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef950e4e7b90aa24d67f7a2075b0cb2abd20a86a33ddd21bb7e85e0a62f3a19b +size 208732194 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_47_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_47_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a49dda2cf2a4445a1b49198d71dcc2c3c06df22d --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_47_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:740f2b4d829fe0744a362640efa0a6a05b8b1a29274718d82511e62a9d8fb8ff +size 208732194 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..16668cf3737edf4ce11006f3ef9dbb945999e9d1 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a33f428b867507e0059f440a502701bc5f695d0c7cae269e79b1b94678673a82 +size 208731426 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bff9e3c72b8abb442e28582d1fe9d883bb3f7817 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2de1b8e4dbeba29308776ca44716541c747d99070623d4d83d6561bf64a1a308 +size 208731426 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_48_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_48_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb790c8f79be5ab5b21cae192ecd04ec784ba90a --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_48_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:601d7f4183f9a06981b0caccf1aa538dcab9244b9d7e6f08cb9a2ddd88ccd4b9 +size 208732194 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_48_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_48_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e6e62a70c6bbaca300695fc8da0e2507530eebb --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_48_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:517e3b27b02ec0eb83f966ef293a158548a0036dc2c24265a0442bc2c836bab6 +size 208732194 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2bae21367e31a9f37f2bd540e2d2d09e67b9e9a3 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cdf1d20047aaebcd7e1568a12b904199d46aec3b11c7b151b97987b796c1cc23 +size 208731426 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..014d2262d7d2048c84150618fa6a2a2520f98da3 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83991f6f40118ad1ec145946a8875b245e24a0650c73ec4655eda53396398d04 +size 208731426 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_49_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_49_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c3e54173dd47cd46887238f8fa54c727f8e51eee --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_49_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8f9cef93c03224701b5c480cd4f734bfb333aaeaa1c90a2357b6f84b8bf5135 +size 208732194 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_49_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_49_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..52e25d1af780cbb59ed27acfc64e9e05855a2c17 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_49_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea18d85df5d2f6384b076a294cbebfb40607c00c152044d89b3ce09af2c27bfe +size 208732194 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..56a1f075e93023720e1ace6b4f5d25a28ca3a9a2 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64efe937b56c6983b0e787fddd9279522ba50cbef37003c4163b1d14f3844878 +size 208731415 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ac3723da31345913e7fc4a50bba24ad9eb8e5cdc --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70ea42abe2a25aa32e366b4be65557b3e3167d5c91ae3a3f60bc836d7371d23a +size 208731415 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_4_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_4_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..df4665475a1bd4e39196fa4741df1282574d0ed8 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_4_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e4c8205e48d4bb4a13c79d76f2682be2ee7b7e811ad9b84d726d05dd83ec39c +size 208732183 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_4_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_4_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..216045be40a3ac7f9375863cda9b305dca259eed --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_4_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c47233558063254831a2740266ffe133857cf5e1104abb4255dd74a82f9b962c +size 208732183 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..796e6e12b5eda63435442c6333f1822f903bbaa0 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfe26e3c5d497bf484c279f8752252e8d56ce88b2a727ed5747f1d084d875e63 +size 208731426 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..80abb63bc919df9d9073d2d294c28491da4d7a0a --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:695fd101c16f477a928e4b042ef105e138745638123e447dfef45ad0ac4d6219 +size 208731426 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_50_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_50_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..823dd33e5a21306befa8977af68d0900ea8415a7 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_50_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39797688218addd2df2f74b8fc827ddfe78a34b63678689e2aa6da6f6655573d +size 208732194 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_50_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_50_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..53c14fe6972439fd16faf5bf467125cc3c51b413 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_50_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8bb049c3dc746426a4f2631df955f3b56b4a06d10439903dcea7d971297fef9 +size 208732194 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6031dcb34661bff28690b5c17ff3ab9365aa04fd --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6a47dca7b937bb5b0711ddd299f0d9698043017e4c5dfcdd155f1b2ea7f3da6 +size 208731426 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..652e31ee22269a1cf79560ecf1a2cd5b93389190 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:611ed72e97c7f8b27b35ca761b413530c7e1c9242615c939fae1f6b107707cbc +size 208731426 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_51_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_51_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..83a57ef9414876caba2cdf8a160f8bd6439e853f --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_51_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8376c03541cced7add66f05cb907e5385fe96c0f1a4232f07b67acb0527da19 +size 208732194 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_51_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_51_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2b1c42fd61895242908c9c561643f0761e84774a --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_51_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:865a3dcaf81f362c52a0c00267be2b47361284635080e3701cd7a42a425e465b +size 208732194 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c409213dd3f9358fea806800f1c5ea0d3e1564d --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e98fb291d3b76dd87163c9f0726cccdbdff65d0e2ace38cee47594b3d5d33bf +size 208731426 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec131de3f89d518e79abc114443fc7e81a88fd8b --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:563d8308e74440368faebd142c704da0af8cab5e0fe8cbc55d651b25230442fe +size 208731426 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_52_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_52_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..61bbc094e44984064460911d81a211a6fee3ae3b --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_52_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99081efcbda40deecc3d990825c631b266d545ea64198dbb75a3022e676de9aa +size 208732194 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_52_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_52_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3cdaba974404db83fa23c47d7944e7b6a511a2bf --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_52_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf443ac2881b5bb4105ff888cdc97818055618c2d1d5bacf76b2721f80d71349 +size 208732194 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4487592b80ded39c0da17fbaf20c262f783c1495 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d243d46f670fd3b953b85ea96a863d96e197406d11968f12343b9df88868c2df +size 208731362 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..355bc2c14e7c771068845b5a6451b95c4dfcbc9d --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d94b87a8be7a86c6235a671321226ebdfc968c491d565adec9adf5de5835dda1 +size 208731362 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_53_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_53_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b6c84363621500537f39c6c12891b3af3032062f --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_53_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a93ae3028c9435fd7e82427838254d1645b71c5197f8dc5353db88a2ac5ce22 +size 208732130 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_53_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_53_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7e4159ff6c06574efb4a655dfef3c19254dffa27 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_53_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d64ae353d8b1d870a66564ae118baeb153fb1d15a71af05e9801140f83a22bf8 +size 208732130 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c1e396c129e09879006f3ead88ae476cb4c9266f --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4255dfa7867328ba3880d18e9913a6f22f5051cf9ed556b1c4db2c3b8ee2c402 +size 208731362 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..793586cde8a85a205675bd397b1c1b8a6486c776 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a634db8d2feb90cded336358ad038fa543e6b070e96c1909c9dd8113033593ea +size 208731362 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_54_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_54_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8d40fb386cb8b0920ca29f41f63583c045d44bdb --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_54_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa27841ebcfee25f96bddacada0ef5c28ff7ba1842d4a143d602b9e0efaf7ad1 +size 208732130 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_54_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_54_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7962bf757aeaee2d42a54beaa60f44ee858abb37 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_54_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87669e25b3bb12a46cdda0e00e17937127bf2c6ff2f47e2c9f5276cd76a8cc7c +size 208732130 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b44dd721de2a6054cebc873322e86d7558b082bc --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91e658b0dc70805e6ebd3f73631db3a0570d792f466d75a7eb4d7ea6e0bff68d +size 208731298 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a039eea73e899850e11828fbac7fc6d77fbe8b4 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a022ee99c5bd5ee7a562dbc95dae0f2d6964478e6d969a81eb70881978ec953 +size 208731298 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_55_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_55_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4867a82abfb216185e840dfcdae113f865e40fba --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_55_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:732c02f50ef0289f171074183217dfb5dd4212ab4eb4333ff7749107842d5eb5 +size 208732130 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_55_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_55_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..086d0e4db1ff2c8285eed21a6e49293ef241bb0e --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_55_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e734292ea7922f7eb685ac26919cbc5e99b2ccc8f9885469ca58131e6ae4d3b +size 208732130 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f2abd893e894d0e31e9bc5a3ff40446aaa9da25b --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fddddb28271462e43d2f0bfcc600ca326aeac7f30845eea3232a379060e62644 +size 208731426 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b21872c86aa91dcc66bc47fa359e3bc23661c38 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:992cc81129cde6af835258f4044f833e71e9f352205299a7b26aaacc362ce382 +size 208731426 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_56_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_56_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ac2c070ff7ca5d76b43dd02fd01fc70cbeaec25 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_56_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62530e8ebb583f601b64fadd3818cbd946eae2094dcff77886256d0da1367533 +size 208732194 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_56_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_56_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..99a84564f393ef596f5a5eec60eca69da24fdc3b --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_56_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83912b83f436d3a651dc227988b6faa722fdbddab29b31fde4c595ff55a9b186 +size 208732194 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce613832632ce55500acf264516d069533c26daa --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d91b323dfb0bcb16e42c538662205382912b5d1af612385fd56e5e98c13d015 +size 208731490 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1ed44a42bb0c66f1e61626dcfdc00d61bc50207 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6ceeecdcab5bafc2a914dc47eaddc1fa8c20cab508597cad77a706aa145629e +size 208731490 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_57_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_57_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0d941b2f44e31275152fc4f4482ffe4a27e9ae14 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_57_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2cbe85f9b9449f0089aa013677f955ceb6db2d9d103c736a01e761550c3d333a +size 208732258 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_57_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_57_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e15e27ad8a04b9b72959a08c6fd6e8a0d983283 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_57_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab06edda11d8dab32d4a17e9146f4ac53d40ba077c150ba930cbd0f0b68c2b08 +size 208732258 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca7b80bd557f7863d240819af556e1305a207510 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:820eab56068343ed1d4a8a2cc5e8a80229110f0bf3e34fd8640f0da097b08ea8 +size 208731362 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d82632e27f0a09adceb863f63e014825eaccd98 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6582a6b7fd5793d669183ade9dd7206f4b55b47c09d807d644e20f0fe41c3b0 +size 208731362 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_58_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_58_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ed7464ce1e7e609f6cb53f40aa4e593c95dda7d --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_58_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8eaf20cdc6a8a7d018f8d54a0c54f3365a09bbbb8e139c7398edbc61d53010a8 +size 208732130 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_58_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_58_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd90cc812111271210562d18a7d56c59f2110529 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_58_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0f9463cea4cc745c89d02f9c4e24afaba89f1ebf7c693290b4872af19cceda7 +size 208732130 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c691c995076b3049736a0af90c9fafb3c23196a --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31cf7bf3faeb60c3fd3c83199e36773fe14ef8fdb7e1221e23f33a0dfcfa0097 +size 208731426 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..629afc29150ae3c81c8b08bff700588916e3a548 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6542199b1b7f2f122de27e78da07c40511f530da22bd1cd32843b905abf49c94 +size 208731426 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_59_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_59_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1621eec7d648ccbf7383c86e4e2ea476156dbca6 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_59_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:953c412b67bc4c52cfd2983785e1b98e18c223646774b319ba78dc92a8348191 +size 208732194 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_59_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_59_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b08d517908bdb9c0ec65f5ccc281856029d8716c --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_59_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ffa06db72fd11c271d537bf49122f7e8e94a81e81a784c0b32ef9cf0f942631 +size 208732194 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..31e0e7742e10dfc6b320015d40319f2c85e305a1 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94250805ad6c4a9976856d7cf4977ec8b0d396f93400f336e3e744147a4b5053 +size 208731351 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e31452feacd140080d2f87d6a5a8d46fa42b0be --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef5117930cf1f22eb87c5cb43cd427feefd6aa4cb82e58c7ed6dc13e690f516d +size 208731351 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_5_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_5_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..67b42344d5a060452f6a1db3b90dad878a58c69b --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_5_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e87649faef628d7ebcc1a35de79de5a90131262ddbaa01d6a8e60437ff209a0 +size 208732119 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_5_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_5_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ce483907907b70ec6248d72a6d4bc35c796e4b8 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_5_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9fad842c721f46fade21cbf0547b375818c07d10793660fb560cb70b65a95af0 +size 208732119 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..53559c24bb136d3ba2029c2ab95883ff2c887e95 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55f5ea10d32d0b4c9400482dd7021fca98ad1b0fa8b9286040ecb11997440ee0 +size 208731490 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..38ef01c78519ff28532233d85c0f4abb52b173d6 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0d3c1afbc00b67b028048bcba5dfcf2cc2d2116d000863f0f4e18f0e0ff21aa +size 208731490 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_60_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_60_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd8fa949497bfb2e316343cb28b42cbc3e55624b --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_60_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e39b15dd1ea4542b75f47a78c319cb744612d5db511aa7c73f63d1bac04c813a +size 208732258 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_60_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_60_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..08a167762fc871b86bff5c7de8948f884c70e3f9 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_60_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b0db95e374b9ceb2a4dee3bbe83b8eb7fd31f728dae1df88f3dbd7059785ee2 +size 208732258 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7e3432f07af5cb775a2c5e01b58db50771150f5f --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c56cd5c698be83c8e1787a5c42c95592a3b681e0764b631f851eb1f72c1db0b +size 208731362 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b01e82b66e4bbf9fa534b32a8c97508d9f5ab6c4 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5715488f83b1f5b44482a5fb5dccd281900826d3dc5db2c7f9b3bd9d3d5b9a9e +size 208731362 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_61_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_61_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..98e9de8020bc37fc2b584ee28f2b55d04194a428 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_61_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f39cfee615e8054e42458c1c476a27681521e6accb8b91510a4e591cbc117558 +size 208732194 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_61_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_61_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a699a57aa119cfeadf7eeb07037a0c129be3670e --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_61_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d7e4f0606976d13f64e00be8609c621220b8352e480258bffb1c35a50c52187 +size 208732194 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..58b0361b48e560f2da24105b17d98cf65774deca --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fdf682da23bea2adde4329f5694c466eeb007bbbb286feff638f31e3f5b7c237 +size 208731362 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1944c1d939fb209db7101ebce4672ff233b40599 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1228cd93f9361feb32bc54e97921cc0503140b8e25b5c7a15e16416f53c4382e +size 208731362 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_62_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_62_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bbbc056bd3123e083ffc096413e4e5f198893791 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_62_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bee0a7e9c92f8d145007058f0bf849b5cad5018d14e86119f2f5e7cc2bb648f6 +size 208732130 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_62_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_62_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..70660ff8e811ed8af679957fe577f9a1010b60c2 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_62_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a27afe25540f06d391fb12b8c6d9f69a3fa69375ffd95cec3b122638952e058 +size 208732130 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e36c56eaef7e75027b5c6ca460d32edb648b69b7 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ea58659a5c0db35fb3f4c2d11f3868d760be77685ff46839abaafcffb24494a +size 208731426 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c4f5adc0864f2dccb8655ff30d4de8c2dc6cd2a9 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d34142259ad044a5db32bc89b33b895ef39387b948968561aa2e3c1038722153 +size 208731426 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_63_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_63_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9432a0318e4286110aefaf3822b5f75d33d73ec3 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_63_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4aaebf22580fcdfde6df1eca6686ff29a686ed3840a092cb62486179c277fbce +size 208732194 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_63_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_63_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d95bbec1f31b59c7f9989bfcfe884311686aa8a6 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_63_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25d43465dd648aa6aaf603b3d182aaf863ebad50f0c1c239d07b39c3a87c0db7 +size 208732194 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3674862d434d0bdf135e6802b2261ed52126082f --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a06a7ab57e4b343f01db3f438afe117c23695c7c32a882dfddeaf48da700a6f +size 208731426 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5dca4a4d3844491920bc258ae92e651176e748e2 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:657338f3e9f6150023d0ba4d0bfeb8a59c1f3f915f43a6795041b73345c2d8cf +size 208731426 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_64_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_64_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..58aaf991db7229964c2b311759cbb4318287ff17 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_64_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0020f3d98f183833823a45dd4202b8f61811fb9b2bebeafc5c5fcc54fcd636e5 +size 208732194 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_64_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_64_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1740bd5ea52e76d3910f7033a093396149fa4b85 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_64_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2883ef45282eecac56539c3fba77ae09e9b4f894cc78b87565d37e5ab2c343b +size 208732194 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..86180ef2492f2d65c35f68e84add6e88f748743d --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0a68bbe3c25841a8e5e72b5df1d654f40f0e48308c0929ec06eba73138d64ff +size 208731362 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b1bd5bab94e8cb5d26e4e4b82c80250a431c4028 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78ed3152477fb85f867d95d934a67d974268b3d7756d8ad065b649b009006c98 +size 208731362 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_65_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_65_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a397c278f0a8c8cc1835bc699ad824a6eb9e7b1 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_65_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af2291e75b2f7f1abf40a059e8af4a0bd03931443193bca31e512d6cda155508 +size 208732130 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_65_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_65_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec477d79aad255fead6683bef55369a4707a2b84 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_65_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71f089103fc21679c7951d4303b71d8fb02325ea86cd6149eca7c5a9ca584279 +size 208732130 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..31742e7a25c1c6c7f5fc9933c09c4cc2fb15b46c --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d45b8fc31561eaf28b942127baa065b4620263b5cde3127d67d59179d58557a1 +size 208731298 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7b03c60873b21b99e2b0131e8a5e51a49c2429c3 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94cf110c4df32514503c3f6d75dd4484ab6e65ea8659285067f23b5af6829c3d +size 208731298 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_66_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_66_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..189a8a0de430471e561a9b9235968f3c797f4616 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_66_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c367a490e44707e0a6b6bb70123719787df2dd232a1aab8d4573a58c446bc91 +size 208732066 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_66_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_66_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c8eb7404ad21bfebea4cedfe922c212628d56cb7 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_66_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c69b40f2e5c4e4063020a74d69691eea42dfbd77bcf8fd15af9d616f6557e551 +size 208732066 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..30230a37b032cb22df477138737b689434b80007 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6f530e1b7b9a78b261a7ad41f4691d7e64464a9f8da2536e6c7e31f67763192 +size 208731362 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf662722cef2f1a19be284024a81f973ec5b491f --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b08e3c4cfc849c662efad681d2bd546f50b6d93a171479bc49b0796d075e174 +size 208731362 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_67_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_67_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6d95c0f41af2ee538d48d8e6d2ba98224427994 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_67_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93fc092dd9034a0b2ef67660725b2a9a54b2d556306ee2aac6db0a9955a48f68 +size 208732130 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_67_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_67_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..37432a52110969a6dfa1bca0e5945b46adf62d01 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_67_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8766f2ab5885d001a3f9a850ac342b886da79bf54717bef381282279cdcdd406 +size 208732130 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ded2e06cc89288aefbb5b9e884dfe650eae28a4 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f24bd6242db773691f19773a56c196fac420dc187b3008c462f5e0fcd466962 +size 208731490 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1597be7ea3e7e878826051a26f182f52c6089883 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75c8834ad409751a0b31f94ddfd42f0175826b8b3689ddf2f8ebee2be1d8dc9a +size 208731490 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_68_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_68_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9fc3265bdd143bc11008bf2ccc6a4a842cd22449 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_68_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee2cc39b5390dd741a85ac5359b0a740bcf07f3613f233b5bc2912132b8e0145 +size 208732258 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_68_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_68_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..96b93fb9f23694560f03dad6ae4e5d9bf90ab794 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_68_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ab62edcc7fc14271ca57eb6087e11d906e803c6e335575d00de953c114a5ff2 +size 208732258 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0dca554587636669177c6295ddaa4a25cd2d8d80 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6931638278ed14b52769012c95d89e181de6f303a2ab79eca695e56c7b6b4619 +size 208731426 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c82e6d63b391983a6fd58dbd60ddd04fddad3f86 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:106da2802775453caf95dd0fa6c710771f52da5bf1f21cd2a2bc02273814d5d2 +size 208731426 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_69_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_69_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0772a838f4d89b5f67f6584e3e9d29fb87ae187e --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_69_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33363439b21fb23dc5fafd379214957af0ae023c96322e9ad06510310b0379e7 +size 208732194 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_69_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_69_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..973f76de7064f1fbd5b633714fa4fe264b4dac7d --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_69_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:846a2bff0342d1427858b25fcb5f4d7d36b4c295d915f408bb9286d5e60f7754 +size 208732194 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..226fbf4dc331ecf11fc9113961a90a8fd0064a47 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9af0831a5c4515485b983ef289392b0f604a90a7cfdce77c2ac462bdd4579acf +size 208731351 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb5320114df3eba0731120347e5da7db55f16a2b --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eee76413663358a45f7b520a64b77bf8ecdcbf6f55cbd4ec448a26d4ac14597f +size 208731351 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_6_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_6_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe33bd4426a8d3cf65cf9e9cb40bf1981087bb02 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_6_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96bf808a196e37e501bcae21307bbc7d72edb426069e6b5a06cb9cbb6ffe8516 +size 208732119 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_6_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_6_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a054dd86564c2579f83d4e1c30fdc325af6a4700 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_6_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b3f019e13244f899d581ac1bd582a1344f26a38e17452125bf49be1d58fb8de +size 208732119 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..383528b66afeb82ab218f2e278098164612a6a40 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5b946b103d5cc42b6118594217b6200bb23422afb55076b913f5885f5c9e1aa +size 208731362 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..89f8247ce885c7e6015516194c481d8a7392f19d --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:766cecae0e4420a1f5db4b8508e0c4e546604c58c23d9fb9a3023af725c48338 +size 208731362 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_70_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_70_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b83340d513667bf8baeafa622ada64fadff1af1 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_70_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e134d3dd5ddda5580d5b337ebe7877b4db2da34c646bb58d885a27aa48edc308 +size 208732130 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_70_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_70_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a29358b05f5bfae1b2e5ca94cbf5aeee4aaeb5d --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_70_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35089db2d2b6e69acb6f0681c6aa4a2a69c3401c5a406c86b747afcb38f4fb2e +size 208732130 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e4158ccee944a0a98c1b311e7de04a4e04b018a0 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64dc7e457e66a43101637701f8dd54bc0d1a63acdbd1c0777af9a3eb88b955db +size 208731490 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5dd8ae166a7db596fb8fae724618ab56f95def56 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:259d81e166a5af9ea9acae8fdf232185b2955ec29eec5a10bac5344040e886e3 +size 208731490 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_71_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_71_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ee0ea1d7b14769698a6bc487044580359c448fb --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_71_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c26eb2a927b1378f5ebd521387be2b0d0e64a23545c52988ca7d5bfa3fd09a18 +size 208732258 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_71_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_71_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d4a82599808926c0c452ad09b9c531d02aa1e14 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_71_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1a5a1f32f3562121da44f80864103fe168a38b5a0e5291b246fed876e3a6033 +size 208732258 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7dee4fac859b009c369e6195e658c91ad138b028 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3e39026430dbb67f0943e6b8d1b3cbdea215abc0adcfd78d276af10ed986b69 +size 208731426 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a91a5fdd6b8f705ddc273ddf691fb6c19340851 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3fa4f52761412e7b4d1128516f901d139f6744585c12cc01f37d91e19d5341c3 +size 208731426 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_72_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_72_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b72640992379220df8d124e9b27ed5a82cf3870 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_72_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ddba787267aded5292475da311c40ec6db5da41398c82df1f6fa5cac81d029c +size 208732194 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_72_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_72_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..24214f64580c45b6763424485b452e0f0c907a5b --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_72_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0fd9c8ed7f6aa3a6c32dd7a15524a29301f2061be588e86a25aeabc900fb92e0 +size 208732194 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d7459dec2e7f822c856983bf5f3979c58847322a --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d1ce7bb8aa16561db2c08c52c1f18487b8096c99d6cd996234ba82d9ba8aa1c +size 208731362 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2539840279cb106543a806d45817d7f09b67aa8b --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:841903321ce6ae115e6479acaf7179c464af81ff2d2e84d0f504127d96bdc4c3 +size 208731362 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_73_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_73_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c34ec6b3cb9882e063c8628aac736f37c8dd9763 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_73_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20ad64afd07600058917a4e660c97d45a749aa24b496ae8f7bb95a3b6af6099e +size 208732130 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_73_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_73_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..59fc3859e75b6f0f3d19ece482077b28aedf90ed --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_73_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a8fd00f818a59a9462961688aa8ea63e87eaffc1742bd95fae459928d4f21b0 +size 208732130 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a5a20abd24424c65c50a2a9f3f12be5a07f807a1 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:097411a0b0f96ddb7e2f5d3098ef2b2bb5c20c1225ad4a2b0f521ebad6c2fd37 +size 208731362 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b2b7a6a177e391a83cf120bef7546056dcba90a2 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5bedf8d1d18d7f0e78a40eff113b3c35298be2e35af6211f6d09e00a3fda3bc8 +size 208731362 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_74_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_74_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ff3a4b43602b8a3b8a7aa33a8a34f3516e63e9a5 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_74_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a340a1877f83fc98dd4516ebb80d454a814c60794af486eb89407549893d8d8e +size 208732130 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_74_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_74_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad77bfb8bcd2ab87506f921ff521020a72f35848 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_74_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b57d718ebca926e4cd5f2f242983c5723b39bde5170ddcbef0e9cb4a16de6c1 +size 208732130 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7b8467e5b78d7d41bf849ad13db3b7f24e7f7cc0 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74f6f6e3e4e9e0a496d04d7fa748431ee7ad782fb5ca509ad5765274791acc90 +size 208731362 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f8d47d06ae2ad14ce10f295fc218574d4fb1b00c --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8403d0a3e97834a0139d71fe8ed7cb9e56900c07c2520317abf0ca9347391aa +size 208731362 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_75_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_75_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d761536b1f2f6182e0ab5857c2839021d3e9d6f1 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_75_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2fe14968644a0da7e81eceb96665996727093a603106a82dbf2ccbdc1764f80 +size 208732194 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_75_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_75_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a688742248c2458c8b66e6e9e1acefa6e898a54c --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_75_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c7eee92c0c79a6ff068fb3ebb205eb872a7e7a6c8a46c7825aaa8112a17fb8f +size 208732194 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cbdb3d0dbdb49791c2f61b56f54b098c41c7cf5d --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ed97fc434686b88451046bc438e9a91020d0193430e7f5cd5bd8351a3d3f3d4 +size 208731490 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2848516ffc43ff8b5ed05784dacd198a7ec4e664 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5bfb42acd9422b378ff3e25d85c309ed3931ec0540f90ff3e649021484b7ff10 +size 208731490 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_76_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_76_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..79adc6abbeb2d68826f422eebb94d393faa264f9 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_76_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:707d1f3f9a45871ae1df9de91ca50f01a0b82c8c03d456a1fb2924c53052c631 +size 208732194 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_76_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_76_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..68505ef28bc788bb07b128a145e0255732985825 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_76_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2aafbc2f957f6bfcf1ea0cdfb02ed32ae95406cb5f2c34838f7182e619a55b3 +size 208732194 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..878f68b0501389339b01e8c70813991fc2aafd17 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:610be7c3340b9f0ac82730496bc9ab2631349338fd37c1df3ba4e551b691ff72 +size 208731362 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a7e859c1fc23bff890265e722c7ebc18cd65bf8 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4608d9e4a62f04eae810581c11ed41ddef973c450a9c2525cbfdf3a7c90d6a9 +size 208731362 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_77_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_77_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3c69b47fe12e2490fcf02f80b63091193a8371f1 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_77_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a97ff4619f5db0ddf55bef733648fd458e650c7ff0cd9f90613bf99ba32c9890 +size 208732066 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_77_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_77_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f6aa24ce2e426253116a3c17a51732a1f9594435 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_77_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e4803ca41b5355f6d19bb4573fa5518fcbe7a510ccb4185bc64d14a568426be +size 208732066 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cff7af86e8b895b38bbd54f104c2328b19bd3cd7 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12e717f20c2341815d3243bee53ac65ece96cb49ed6a88558974e1887a6ea877 +size 208731298 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eec65eccf9db33c54e30a826073b9e33e8b10bc0 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20e304756d4cf42bb47bd24a966978bf8d385be467308c6e4dbc22ca42614734 +size 208731298 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_78_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_78_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c256a92c8593e7de9d27f477a1206491c380aba6 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_78_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45a81417dc653d666614e22d59ac2e016b9a343825f11719412a35ef8a47f11c +size 208732066 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_78_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_78_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..08f1ebfcecb72206bd1584db08b2675139b1734d --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_78_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32931bf7e2a1cb44f12685fb40b315148c6a72f64d94bc4a7f005395995dc560 +size 208732066 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..236e62b1523cd649c8b4e7d1a3faf0e1a9bb7ef5 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da76fabe515fc7684aad9a10cd9430085112f4ca42073ec0a0a1c9e28d1036e4 +size 208731362 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..80e83235dc6eedaf3ee3be062d83d765cb6e6403 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:853de3907b331384638c394543b1b2481cb9856d8e40cb90830d1c7f4bb8ffc4 +size 208731362 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_79_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_79_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ad57c3184d68418b11aafb2cc2f1af70257068e --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_79_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7df6bd9401f49664beb99ab6a21e5e88d5ae10b61ee42551827c7139ce277486 +size 208732130 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_79_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_79_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..480f9ff33960967a2a60092d08d4b7ac48553c68 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_79_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16d8f525fb41ec85ef18ccd5e74e0ee35c70e538be1671beba32bf5bc3d70cd1 +size 208732130 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c4ab9dfe0ca2598759a5b04e84b70ad538449d8d --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cde28153d5d60727c54309a9e3c87c3f548241c06e1dc16d10547ae00c23ec40 +size 208731351 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a16b671943280bf00e91f8d52fa20a6d58bcfa36 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a87579c0e9f0cdd0df399a4d61f1fa8e69ccb592c76ee9eff5d7e13e40a86506 +size 208731351 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_7_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_7_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a65d2fa1d9d3fcb50a6019f45dec93042c7da715 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_7_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c606a31b834bb159007a0568c86e7ab3dcab328eb6c56350ba3ce4b0fc3b6ba7 +size 208732119 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_7_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_7_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc2198451dee4def9c7810acfdd73059032634d5 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_7_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a40e5486374fd63b2c1f410013f5c2fdd5084c8535f684e8e4c925562414719 +size 208732119 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c75dd58b79774cf259a361db5cc6b257c5db20e6 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa3675d3c4a5df14634bd85831cf9d924f34eb8b66d04ba24822a8e8a3aaf547 +size 208731490 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b4e815ebef7c6d88989097bf2ddb82d40720b706 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0785702c57cf8e8090a1ba29dac085a52a176f2b90768a83634ad8d19a5e45b +size 208731490 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_80_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_80_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..66d8b4d39aab809434d8b13a4d35e905c0635c31 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_80_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21efbf3864f6087dfacc66e72baddeb67e7f41c66385bc4555508f9bdfa20bc2 +size 208732258 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_80_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_80_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d4cfca16131f771e1fcf3e1c6d18e23fdbd42046 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_80_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b9908c6b837fee3b3c5b014b5752395856834ae490029afb3a0c32f96a4c065 +size 208732258 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8c6c0aaa38d4d64c44b3fc799410f22f4da6253d --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0e2105f3a99e47f3b4de1c26c8efb97d80f9459376825634cc10f9c75147719 +size 208731362 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..439ab3c923f96251eb921e3a28692b9e03ae68a3 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e4be7a8d46dd70bdafe1564e81c2e957f0b9a2cc5fdb43c9cea88b7fef6240e +size 208731362 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_81_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_81_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..021cadabab1851df6c985f7be4d9ac8c9e38d5b1 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_81_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a120b858f324dd1b346e543f4ef9d56fb0fe374e07884ff271fb24d4fd0cd36 +size 208732194 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_81_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_81_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..80ff79bf2204274abfe48d8b2e273560d0f3a283 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_81_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a43fbe6edd9975b38e5586cfd9c70d6e46606d836c07d13d138403e8727ff2f +size 208732194 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..71472b576cb1c4b72eb2bc666bd7491b8ec20993 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0e6df4d866e1494ff93a43ebbce050e8551bb4936e1c4c3a1432f3977aaee83 +size 208731490 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b6164384edcfb6c2b4f429ed9bfb05d665645f8e --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7dc2d8165d555cfaed5a235051292dee5bead239e72d128dc43c7a21c41dc6b5 +size 208731490 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_82_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_82_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a3b94ce7ff681ee1fef8e196536ae4f8a7098a7f --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_82_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d044c5c9b3a2a5677915c872d6ba194173dc0d3e7b80a0398b55f1a7f6007d41 +size 208732194 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_82_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_82_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa95f5fa48486a5024d24e6e69f35a068b1f53fa --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_82_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0cd082148b5714239dc451ec1659d9cba4414ed57c4d8311ecd0634367a50598 +size 208732194 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..479fa3ba0da85c3db5ffb11e4818672a519f65e0 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10bcb9820402eb1e55e9814c27e31c28f1386280979c7a615b70a751eb281a76 +size 208731490 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..00b61e13f9a482d3c9f29ebe2cfc1e652bc8041d --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9782963636ee3a95239a3ff8d8bb57f37c2661af29a94c36b88f1c9d13a74546 +size 208731490 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_83_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_83_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f0f3a779da6bb89789790697c62a62f0329ecc45 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_83_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c202de28e86339877afb431ed05c84ca8df3f7a11106fffeaf45f96ffdc8858c +size 208732258 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_83_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_83_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9969c3171ff3490a41ffe2531a9187a7a965e8d0 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_83_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f4ad6f7dc480ef1cff098f78dda71f3fbf8b4cbfde6321df31f3eec99950be4 +size 208732258 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c0c72bf2e0266a6a3e727d5fdeb9768c1b0448c --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f3ca972607d2a2a7e930e3130296b889dab46b76ad304c0227d367ddf2e2976 +size 208731362 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..04c7eac1a72ed2dbbc25460578da83924708c270 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e1fa3ce04fffe24e532ccc2f3367b1d56e8bc6a5b9e93692af1ce2c8c6db262 +size 208731362 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_84_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_84_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d31e655d0802f82f718eaa2b9e9510120614f9d2 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_84_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fea4fe9c13607cee600d9267c2f0b0baa9b15248abe3987b5bd2519c1a74c0d4 +size 208732130 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_84_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_84_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b60b9b232717a5053df5a1386dcf1332ee34adca --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_84_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:374bc569f771946beca4a2672b6a77df4f4f48d52044fdf098e622b0fd3d3f31 +size 208732130 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..78e7421552be025016c80d25438b69b31cd5b056 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27d07db36034c66dcdb59f8f6a206e8954e236d2e0176251d3275a5a6783db51 +size 208731362 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a0d5e1e14e55504d3ef03f55c7342ad680f150f5 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8efb53e3cede2739050458b3d568b4a0e0994aa7494ba0df318df9cd0611478f +size 208731362 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_85_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_85_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5626abace8f77f4e210d01ffa031ad6499270d03 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_85_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95f92c57b7c96d6dcf8c1e93fe6baaddaf0852d9fb0263d9362beac10591a693 +size 208732130 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_85_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_85_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..98331faec80aa15c0ee9cfa01bfd103122be9236 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_85_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8e372ff92d2965ec7f39011e77db8cb7dd5c9d64fd29778104e87cfa427d05a +size 208732130 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a4b0138e50ed44986447adae704e27d6e3d87acf --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be5a0a7ca5eb23b6b732530bc4a4ba443824b09ed886f60640484e1e29971487 +size 208731362 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2298e216f97b23c4b2fa4bdb33598b7a34ccc6a1 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5fac4511c2b7bfb9a11618348d1dbb30362f5605fe5ee8f6d0b870f2b8e67f7d +size 208731362 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_86_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_86_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f5a2d1c93b9cb1281d79f0b7c1a39bbe89752a86 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_86_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2c8ef74a037cc197574639aad71b720b03527d16d1bd60b95c4b5650ecfb5ea +size 208732130 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_86_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_86_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ab9eb8cf892af827a7f1108aa7a3211a2db9a47 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_86_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec1f68e11f36bbd066afca326bc9ddf516c45538f8a93763307253992a6d04ca +size 208732130 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..845c5fc65f15efa2b2bd6308f70f9fdd249d4f6e --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a4121df7b2b69cb72e2bd0cd5f101900a3de7de9e5d66675feaf816cdba98fb +size 208731426 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0d2f277912e8a6aae6a7fff8fb16d0b74c220b40 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:944288777d82ace3b3762790e53c276cafdbb94cfd98e83bb84fe37ee21baabd +size 208731426 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_87_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_87_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b8c5eec77c118086d343d9319de999e95f238a3f --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_87_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ed898304a18681c275d8876350d99c07111a73e09225f2d2da8161294453fcb +size 208732258 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_87_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_87_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c5b098c8bc3950df87e35a3c2e644f0cb645b8f --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_87_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:445b1fb8573b31ad2156382ebc2ef3aaa6a7a1c178868ec71dc5a75428a892cd +size 208732258 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..725fd2a065080e339c029ad42d9afa2b98d06fee --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c097bf55c0ad7cbad800e1e26919b19e7278d8ccc37a345765a03f3358e16f0 +size 208731490 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3eb175d3c56bba57969cca95c6719b8eecd93bd --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e46c7e3546404d315e9621c90636130893c1d3ec71570617deae860fe3715b88 +size 208731490 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_88_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_88_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f0de91ea694de1a9d1e6d7ceb71f95b5afebb5b7 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_88_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8f710fa301bc8096dff520a0807c6a015017f1263c506bc9fd7265ff6bd5956 +size 208732194 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_88_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_88_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb1b61b88b87d714a035b1015da6b6f9e16548ed --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_88_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc6e5d32671f1ed6f171e03651000a3f20f82902bc2846f35cd1a009b6e84b9a +size 208732194 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e8ff8646b3ef386730b51e9187dfa0a926f459dd --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45de158ffed7860ebbeef71693b30083bcb076675e99b4b6cafe5347c6baf1b2 +size 208731362 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a2999ecc8675f4fee02f467168d1d70469eb71b --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f201751580deb0e0649117435d81bad4c729464b5695568c942d68bf77ce4ba +size 208731362 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_89_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_89_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6699d908b808f2b52b90ad2b1c844c66a4694c15 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_89_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e58ba3afbd7c4691eceda444eb5b787cc761249891aab04b7e4f26c6ebf6eec1 +size 208732066 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_89_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_89_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7a80c9dfba4b7755109f46b0f3b938b88bda3347 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_89_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f48a7d0ece03c67c265614cab82629d08e6385274f0e6cc618da9a4b14df2d9 +size 208732066 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ad4f49f24df6eac9c2b5c8228d690435083f93f --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4da2ab72ba006ef0b379da02f0add4b11ed25f972b56a9aec05e20fd9d6dff53 +size 208731479 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ff58af268938564af3f1981c5d0a980f4b500a1 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97c2db6b71da627269355529b2e353fa53d66c96378e4d860887adf56837d354 +size 208731479 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_8_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_8_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..71f8652bd2ee6f76ef2c1a4c90a60c9e240df528 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_8_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e8bd206960b0f4c0872c2823ce924aa3cd2f8839db881267767c944b68177db +size 208732247 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_8_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_8_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..45368e6afdbd607c78ee403dbef42f817385657e --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_8_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0a6112daeff0757983885da4693c154eda9a9c2dcd1ca93e5cc2a01070120f3 +size 208732247 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..feed6580fdeef10ea8b455b0af06811660b5ccfb --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73b9a9b7ca3982ee163d12638a0ead2c35efb86136dc9807a98c77499fa1d4c0 +size 208731298 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f297cfc1aa6a57999a2b3ed36abfe7f839156db9 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0693147907df87d323e35d339e150cd751d26b5b2a01620e589ae3e91feb440 +size 208731298 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_90_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_90_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fdbe874d5862ff27e12ef6679fc490ef672172bf --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_90_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51a96cda3fd8c62c7bb07893b057560bca4f13ea377863adb8388d6e3a232325 +size 208732066 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_90_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_90_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b2a41646653dc68452a4296e4c727c9b90f30d82 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_90_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21de213805a06eb62da1993ffbca0392d489bc6adb2e4414b8a4707793c6fb95 +size 208732066 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..999637e0ae9736f84cf70740ff7e3e57d88733e3 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3dd8981cc65502e3f73412f29df790b658770ae027479ef23b7b7ca4e143722a +size 208731426 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb4e6dcc35078fb589c0f25bd329f13c45963f38 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef5266742b909f0c43d820155ea13c4eafa2fe727dce33b7318b9e61bdcc7c7c +size 208731426 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_91_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_91_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a76415364d131c747c19cd642e0a95f9b74cc9be --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_91_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b13f717ab4b4b77b46a0844d1b14a1cad903badf97c3a1d9ed75f23ee1ba0e9f +size 208732258 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_91_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_91_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..52088f70cee64190477e01cc0107eff4e01cb01e --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_91_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44227528f390a6aa6b1d87213c694745e581f00c18716e79e14ac2648e8ad227 +size 208732258 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b5de2907837b9553155567d3467c4d3b9270cc88 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29b0a04b386e6ed3ee34068778fda52ee31d04d794d1526c12d8f254a7096f45 +size 208731490 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5de3f62d0641e0c9206bedde0271ceef59eb4989 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6b76f912eb10fc48b66dba361dcf4dce201de3f0e0601c1e5e027b498b76a2b +size 208731490 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_92_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_92_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1eda2f1123ed82384ca3339ffebba93712c6c8c4 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_92_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54011a115bea619b520379d1cac4149bff58633cf2da874af4a0820a0f3f7a93 +size 208732194 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_92_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_92_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..96c30de0efd00f3fd2dfc1dd0fec9356be500b51 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_92_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d16526863b6cafa64cab27ad14a84ad96094ca87111702c8bcf1180dcb3177a0 +size 208732194 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ff0db1dfe4a859a6cc5944f36ff4e853ddd099b --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2c0a64f4c75bd707f922a32b0058effc0f2a24d2962ecdc57b338bfdef2516b +size 208731362 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f0e9bf21790b81108ec38e1437c0ebbfbab9cf52 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6fb13c56351ee955ea96921a31858a2afc8ada0c9c5a1c5de89984bde11bc058 +size 208731362 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_93_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_93_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c492e17fdc3b5f43ca8ff00ac8232a0d913da492 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_93_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa6b46e05ee6805154732113b2a72b82ac34439a70ab50068e66b24aaa6c7bc3 +size 208732130 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_93_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_93_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7214afd94161434d751cc9026c3ae552d2621fa --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_93_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4c83245f9b8bf3a0b5c7eee8517d9f180f6554116f943be042b62ab949f8d7e +size 208732130 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9be45e5d39e09cd487070b7eb4d7914240447bc0 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6977fd61c50628558c6da0c5902983ae06f4c717173f7e3b50ec02ba2c6c8f5 +size 208731490 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d504ae62d9c17cffb0e1fc566282f0c1b681e0cb --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0376212fa8088ec11597192969c3d1a7967b103490555f2da63362dcb3b210c5 +size 208731490 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_94_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_94_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fce01e3bb10266c36114935f29a6a0f477ba64eb --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_94_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:587bfe21b73929c8a0f0a9ff24140c77394b491fd1a9fa6165c91558c786e9db +size 208732258 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_94_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_94_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7e48b312ba0871740a220099da4dde5c8054489 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_94_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44d6a1d4f4f65b574093089ec65513f15234044982886ef817ea3632b2b980f4 +size 208732258 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a6e64a590581f6320221b7a55f723bf016d21e1 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7abbb325ed4bec5597769e86047532e2eda0b1e47b8dce46d82c859a1e4b2d06 +size 208731490 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0885b39915a44c2c22626635f4328a707ecee6d7 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9fd4dee967bd618065fa1fedb279c017353ed5c619e2378197b3c98e79c046e7 +size 208731490 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_95_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_95_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..79dc0ffa8fdccecf80c9cd120ecdfedf78810d78 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_95_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4e669b3092b193f5c002701ee955921145dca3a2fce1314539721402a77c2e1 +size 208732258 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_95_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_95_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e0048106071cf7f1c479c5c587cb4c01e73f7e23 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_95_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db8f797bc8fa522046c2e90d87b638f30ce20284a5bc981555da663606191de7 +size 208732258 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..65b3d82038194e3b88ea8bfc608536862a57b5da --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:943268640a62f1004a39febc7c597c8491ef526c22b72afcb017d50f54bad2d9 +size 208731362 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7930b30124dfd60ff314ed3c8108fa274ea66e8e --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd3e7ee59af364d9c1487ad5aa6dd6aa6fb515e4377a390ad5c66158bf78e98f +size 208731362 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_96_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_96_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f7b871f715ab57d0f1deee55e58f9cd1efc05dc4 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_96_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:672d06b3122770e4d05bdc12c607be089abeabe85eafed1e35e2ec402854a163 +size 208732130 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_96_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_96_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c845923b1d11cf3c827ea5a318d6d27a6262343d --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_96_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86332ecf943086314116908a43231bcc1c951bd5e9a59d0531abbf8b8415f97a +size 208732130 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..08732cce092714ab386fd5b769e935cf74235af4 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0fff43c4b08fd221bdfdcec5745eb221522ab1d5158e6ba31d32660b822cd24a +size 208731298 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..47e6a480fa39d61511caa51c726d9dc332264ed7 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82ed9afe6ee67e35cfcacab7ceeaa722e8ee0f0c282009fc37ecf6847e134108 +size 208731298 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_97_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_97_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f9a743e1f17416b3cef4398827c556863afea1ad --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_97_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba2d8ed4c97d1b27ff07bccfd7f7e9597ab614a33c7e2d88bd6781c81458ac27 +size 208732130 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_97_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_97_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b80b55ac03dbf6822e4f47f567cf64ea95707a3e --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_97_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0458d11508bb50d05de124b6d33a75c935203826fddcd0edc406a9316a5c259 +size 208732130 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9cb9df08f9ec2945859072cb148defc975166b88 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb61488ca6437c0a02802eafe4abb015622f0fcfb1c6d1667e5cbca435715617 +size 208731426 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..20dac60dfece8ff2d91e92a28ff50488bcdb6b71 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a8b757ad7a912d3f27748dafd41b85257dfe2517bc02f4a4c7c8c1230995eaf +size 208731426 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_98_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_98_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5feff9db53cfa8588aa733e46f06b3d7ec8a2515 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_98_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd557497941fd259f90f3a5a79436546c9efbd02b68d9b13f6428d4b4fe837ab +size 208732194 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_98_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_98_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..da9c49d9dab5cf19877a68ec91903de8ea8f3934 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_98_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c0407854f787787aa8800675e9183089f1ca735277d2430a6a5edd66541e2a4 +size 208732194 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..be88a6eeb19aae2be38eda85479ae99c947268f2 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39e5af67dd39ab64fdf6474736aeb68fabfe4144f294fde79837a46c512e0479 +size 208731362 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8011f93bcae95c7772945992da87eedc21dca3aa --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:516b48dbf485578844aad6908988ac21cd0b3a2c9c1e51c9e7465614ee9a9e12 +size 208731362 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_99_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_99_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5cb971f3bc8ceb30f2c5548e93eff3d247c61463 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_99_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3cefcf19009ac5ccdeb897011ec90df37c66c9ac265e4e50ef69aad8e9e9f420 +size 208732130 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_99_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_99_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..67021e2520169d8da27bd9adc73a51523c620720 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_99_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0cb1142d5009d4c8b4c3142403ba8b775c10519671e5ea780c908f86aad322f +size 208732130 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5053fd9d2957a637ab72a7defd6454d25ea81ce8 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3abf76fe1f502da9fb7b461e04248a86c449ee1fd130c26aad2b4ba56a394c8 +size 208731351 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5939d745019f9dc167f81a3e86bd54eccbca2b4a --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd02b4c22bff6a862b3f9107cb415439c34ca71c51584d79beda81bc41039357 +size 208731351 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_9_mp_rank_02_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_9_mp_rank_02_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e88df4aa2f5c5ee8f3ae7e40f91ef39ab9fe1707 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_9_mp_rank_02_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1b757ad313f25be7801f8db69f2b1e0e23940a8c301605531d24ecd26dfc1ea +size 208732119 diff --git a/8b7178b25b/global_step84877/bf16_zero_pp_rank_9_mp_rank_03_optim_states.pt b/8b7178b25b/global_step84877/bf16_zero_pp_rank_9_mp_rank_03_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..de52988da51b32f64fe654e209c65bd16f1a1649 --- /dev/null +++ b/8b7178b25b/global_step84877/bf16_zero_pp_rank_9_mp_rank_03_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f065fc1785d5c59ffa6215c4893c250533c45527f21a2873dc75eb1e9b14ed9e +size 208732119 diff --git a/8b7178b25b/global_step84877/layer_01-model_00-model_states.pt b/8b7178b25b/global_step84877/layer_01-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..566e99cc28a5d9b63c97544ad5f178e4dc08bec6 --- /dev/null +++ b/8b7178b25b/global_step84877/layer_01-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:348f17278c8ab8729924c6063bd16ad7db393658ae068882e84c822081da2a73 +size 223347971 diff --git a/8b7178b25b/global_step84877/layer_01-model_01-model_states.pt b/8b7178b25b/global_step84877/layer_01-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a92c6568d324afab143039b4dbe63bf451028bff --- /dev/null +++ b/8b7178b25b/global_step84877/layer_01-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ee84bb2c68c1909818e73d2b8fea7ec536bc57194488e4a70ccbdcd4c60ef8e +size 223347971 diff --git a/8b7178b25b/global_step84877/layer_03-model_00-model_states.pt b/8b7178b25b/global_step84877/layer_03-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a6a8516fb5d8384ab5c453f777459a180f8d0d5 --- /dev/null +++ b/8b7178b25b/global_step84877/layer_03-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f218ef2147159861f8e5ddcbe104b5889ae6c8aee3890ac9bb477b5e2ad390d9 +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_03-model_01-model_states.pt b/8b7178b25b/global_step84877/layer_03-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..94e3b55f21c4215322c4d985d8919ef43018b4ee --- /dev/null +++ b/8b7178b25b/global_step84877/layer_03-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7df9d3c1fb2edb9328b8f5487cb8831e9c9d9e74392f0f89f4dbb98712193cd +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_04-model_00-model_states.pt b/8b7178b25b/global_step84877/layer_04-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1016cc674eaaba4cf1b2071ad30ea10b1a8b4d5a --- /dev/null +++ b/8b7178b25b/global_step84877/layer_04-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ddf6a84bdfa21d3ef32c9d79ed6de450e979199511e1bfcea9bf1c7ed1450ce3 +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_04-model_01-model_states.pt b/8b7178b25b/global_step84877/layer_04-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..699c24d1be9f477e0d9f1d0a41facbe126c75606 --- /dev/null +++ b/8b7178b25b/global_step84877/layer_04-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5521c8cd69b0ece7cebeb12aebf2512695fb465b147086af277777960579082a +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_05-model_00-model_states.pt b/8b7178b25b/global_step84877/layer_05-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e6fb884f705bcb8e9e73439fdab1f5cd038122fe --- /dev/null +++ b/8b7178b25b/global_step84877/layer_05-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46662b3262395bc04940db2557d58a91abed1e6ed3c982f41eebe40c768313cc +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_05-model_01-model_states.pt b/8b7178b25b/global_step84877/layer_05-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a730e1e3f0978334af23520bdcf60f3fa381f4f --- /dev/null +++ b/8b7178b25b/global_step84877/layer_05-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49e88fba0d447e5c7fe113344479a8ad9544317cbcc2e1d4f65fc94a9e2f662c +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_06-model_00-model_states.pt b/8b7178b25b/global_step84877/layer_06-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae7b86609529ebd57a7be84d0108dd74cf7a0bfe --- /dev/null +++ b/8b7178b25b/global_step84877/layer_06-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4dfbf1383ad598cf8718be0e26aa60373d4da8cb60a6501357fa216e763105ef +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_06-model_01-model_states.pt b/8b7178b25b/global_step84877/layer_06-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c390a6ca47e95b9baa5fcff4d59f2fdaada743a --- /dev/null +++ b/8b7178b25b/global_step84877/layer_06-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad70e97b1fff878962648b3350d27eb43daeeddf07857e6a300a2f7c862d30f2 +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_07-model_00-model_states.pt b/8b7178b25b/global_step84877/layer_07-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fbf6e360bcda61bed75ec8b4b85c749565fc258d --- /dev/null +++ b/8b7178b25b/global_step84877/layer_07-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19127ee57d56d4a9756356900e341d662658f00663f5c8d442e7ca13401692b8 +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_07-model_01-model_states.pt b/8b7178b25b/global_step84877/layer_07-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c12c463434c460e6bd5081cba87a06dda55d700 --- /dev/null +++ b/8b7178b25b/global_step84877/layer_07-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2253fe2074dba1df7d9865e8a7985fe93d62c420396fd0831f6f6285e879a7d2 +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_08-model_00-model_states.pt b/8b7178b25b/global_step84877/layer_08-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ac697d2a9272f275b937f288c04de696f8a7113b --- /dev/null +++ b/8b7178b25b/global_step84877/layer_08-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b25f8fc43b4503361086a0998d1a8aa50e1d7f2ae402424fc8a74885442cfcfb +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_08-model_01-model_states.pt b/8b7178b25b/global_step84877/layer_08-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd9c9b73ad971aad7c92507c60fa29c5c373a9b2 --- /dev/null +++ b/8b7178b25b/global_step84877/layer_08-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ffa17dbda2b7a93ce4e654dc9a029de2edb5e8e46ecb30fae4b0e8dc7b781b00 +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_09-model_00-model_states.pt b/8b7178b25b/global_step84877/layer_09-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f5734d91dbe4e7b037b29d04aed810008d617cd1 --- /dev/null +++ b/8b7178b25b/global_step84877/layer_09-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:887216340d165dff64401e6af660f0fba323699bfedd1ca4b28710209ef1fc44 +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_09-model_01-model_states.pt b/8b7178b25b/global_step84877/layer_09-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e7eb323f5f4c24983320b84f3a5d4867f206baf --- /dev/null +++ b/8b7178b25b/global_step84877/layer_09-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33b8e1e46e0e5bbdc1c67e6dfa84bd6709957079d971ac87b9ae9e2d2a97343d +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_10-model_00-model_states.pt b/8b7178b25b/global_step84877/layer_10-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f6e563e23cd8474b1df7af1409d8733a4333f500 --- /dev/null +++ b/8b7178b25b/global_step84877/layer_10-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99b19d0151d2110bfe6bca3dac84e4b07158ba4ba3133ea17644e2b963c1bac3 +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_10-model_01-model_states.pt b/8b7178b25b/global_step84877/layer_10-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f18ce18ca935b832c0e3ba4adf47e776a7ea0cc3 --- /dev/null +++ b/8b7178b25b/global_step84877/layer_10-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e28f66d6f9f1f8b6e4f932ebcb8d2832c1772a9a6420d9169d4f462b8e706eec +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_11-model_00-model_states.pt b/8b7178b25b/global_step84877/layer_11-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a5baa4bcb3f4ca36613a7b7b0364c5911daee04a --- /dev/null +++ b/8b7178b25b/global_step84877/layer_11-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08de3d5d7f1c073874e817b5fc9fbec1b09b2d656aabb66a58c04b6699aaf188 +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_11-model_01-model_states.pt b/8b7178b25b/global_step84877/layer_11-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf826341766aae42a05e6b4ae0103c4863af9e09 --- /dev/null +++ b/8b7178b25b/global_step84877/layer_11-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e00076df28fb278392baa4814b415b8474c9b36ca0f5e23c9a167a38331ce95e +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_12-model_00-model_states.pt b/8b7178b25b/global_step84877/layer_12-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..28cf876b264b1420c5b6c85228a71bc99172268b --- /dev/null +++ b/8b7178b25b/global_step84877/layer_12-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0fdde17ffe65ed541f216e700aa3b30048926540425d74cd0ba9f2908c243329 +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_12-model_01-model_states.pt b/8b7178b25b/global_step84877/layer_12-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a06bab465d98a88c164460a8b76b44a9422a199 --- /dev/null +++ b/8b7178b25b/global_step84877/layer_12-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4413cfded0a873b1f625ea133047671d72ab99c939ed3afa35b876a39f83dae +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_13-model_00-model_states.pt b/8b7178b25b/global_step84877/layer_13-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bc452000deb38f50dfc957461c047f232c765a8f --- /dev/null +++ b/8b7178b25b/global_step84877/layer_13-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ed17e9be16f52112fa170410e64d39233a5b23b994190a2597a87c9f23d9b18 +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_13-model_01-model_states.pt b/8b7178b25b/global_step84877/layer_13-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b3b74f86aa1c31e7ecd38e1580b3a36e9bea410 --- /dev/null +++ b/8b7178b25b/global_step84877/layer_13-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e76618b814d00a4733d64c2fbf6fb10084e9c05b04be37581d75a54abede54ce +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_14-model_00-model_states.pt b/8b7178b25b/global_step84877/layer_14-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bb76dcc4668dc3381eed259761567cf42d9a2bde --- /dev/null +++ b/8b7178b25b/global_step84877/layer_14-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d7a1d8df1a4e73f2896f775d4f14fe47688b7b783faf827a8cb8613daf6c707 +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_14-model_01-model_states.pt b/8b7178b25b/global_step84877/layer_14-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..52b21450c99a7825e86765373eedc1cc7f90c88e --- /dev/null +++ b/8b7178b25b/global_step84877/layer_14-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:816de7021bce1cd55a51f64ee9407fb4cfe8cc01b0ce538ba1a0d16a171e2aba +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_15-model_00-model_states.pt b/8b7178b25b/global_step84877/layer_15-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea148c5a25006571160354f975a881df65e28f12 --- /dev/null +++ b/8b7178b25b/global_step84877/layer_15-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25cf16a15f86cc237c193db3be284d8ee7f3ffa647b06d72615e90c0fd4ee036 +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_15-model_01-model_states.pt b/8b7178b25b/global_step84877/layer_15-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b77a6f0f3b7f5540aae65339202848933df37d02 --- /dev/null +++ b/8b7178b25b/global_step84877/layer_15-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:136d66a9a50cb6e5830616868321a2cfeb7030b5bacac6e8129390f54746a030 +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_16-model_00-model_states.pt b/8b7178b25b/global_step84877/layer_16-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a29c5fdf64dfae7d97b75f25ddba00e572b5d140 --- /dev/null +++ b/8b7178b25b/global_step84877/layer_16-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3b3a2dd8b9af8ea6042a3573552543dacabfca39e64daf11c2e7e20e50183cf +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_16-model_01-model_states.pt b/8b7178b25b/global_step84877/layer_16-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0020334eb97f8c664ca4ce8692a465333448e8ae --- /dev/null +++ b/8b7178b25b/global_step84877/layer_16-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f8424cf9dadde00da925bbd7eb2f0ab6e137ef30864e9f47829b1476f0f458a +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_17-model_00-model_states.pt b/8b7178b25b/global_step84877/layer_17-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9aecd9f468362651f5cb9acfa3250f8d62e89e26 --- /dev/null +++ b/8b7178b25b/global_step84877/layer_17-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:017184106525071595ed50171f9010d09220f72178b05acf9872dfa662a54f5a +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_17-model_01-model_states.pt b/8b7178b25b/global_step84877/layer_17-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea19fe552d9e502a6f5356a3e097b70c6b2d1fc5 --- /dev/null +++ b/8b7178b25b/global_step84877/layer_17-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3de1a437b6b7daf68a95be96857a9209c5fcd51d7ca9c84006521b34010bb2b +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_18-model_00-model_states.pt b/8b7178b25b/global_step84877/layer_18-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..694db053577c5256201e78189c38b6a035857a3c --- /dev/null +++ b/8b7178b25b/global_step84877/layer_18-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ec498c4207ae64dc5a072a35e80675c98f280de0f2a222a8316cb10a5ff022f +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_18-model_01-model_states.pt b/8b7178b25b/global_step84877/layer_18-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..91c4688d83f9456b184ad3fe912a71a448b5ea04 --- /dev/null +++ b/8b7178b25b/global_step84877/layer_18-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29c3ada6a6acc9707003cc92a7f8704d4dcb8af1ac4fbed28e90a8178eb0daa1 +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_19-model_00-model_states.pt b/8b7178b25b/global_step84877/layer_19-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3982961cce4b3c66991058959babf5b6152ccb34 --- /dev/null +++ b/8b7178b25b/global_step84877/layer_19-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b2689576ca7e6e3bd98b503582e519407493e9ded50a02e426449fdeb0e1a40 +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_19-model_01-model_states.pt b/8b7178b25b/global_step84877/layer_19-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c61aa2f25b2619da64cd1f06e8d165391b153463 --- /dev/null +++ b/8b7178b25b/global_step84877/layer_19-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0332d81d6d44bf9498124ac4a5efb39c40ff147a2d9673255a341ddd9454867 +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_20-model_00-model_states.pt b/8b7178b25b/global_step84877/layer_20-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..070392e83c759812c7efd0c790f4978632745dd4 --- /dev/null +++ b/8b7178b25b/global_step84877/layer_20-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e5406a994ff1fbf402bf843dc31241deeb1cc935fd1f3afa3302b0e6c8cdd30 +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_20-model_01-model_states.pt b/8b7178b25b/global_step84877/layer_20-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c04353118eace07838c82a9e4e9447398dd3f28 --- /dev/null +++ b/8b7178b25b/global_step84877/layer_20-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e7569c4412e5a132b016b571efeacc493ad5a36231de48bbda037f064152eda +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_21-model_00-model_states.pt b/8b7178b25b/global_step84877/layer_21-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f2189f500280d5631a7938d042f8fd4ed92d3a54 --- /dev/null +++ b/8b7178b25b/global_step84877/layer_21-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5466e8d8976afea68830792362c9917a0d5a5e334000b94dc7241acf6def3c64 +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_21-model_01-model_states.pt b/8b7178b25b/global_step84877/layer_21-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f9917ad87c221a08e545177da26d2c63c615d54a --- /dev/null +++ b/8b7178b25b/global_step84877/layer_21-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea501e559382dabebed622b7652e94d3e01226dcb60af3f1955192cc6f7e65f2 +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_22-model_00-model_states.pt b/8b7178b25b/global_step84877/layer_22-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..465038c08ed822c8c7a03e1bb043291e03ad4879 --- /dev/null +++ b/8b7178b25b/global_step84877/layer_22-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ee1871dec31ee442a3adce63aeffa4f0ebfc28b0a6574ca1811919a44db28d0 +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_22-model_01-model_states.pt b/8b7178b25b/global_step84877/layer_22-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a0a2d814482d8b5d1beb6c5c5ea673a44479dc3e --- /dev/null +++ b/8b7178b25b/global_step84877/layer_22-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ddb9067bffa921ba238ad2736eda37e92c972adcee569f9d97d15561802a354 +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_23-model_00-model_states.pt b/8b7178b25b/global_step84877/layer_23-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b2ea56ab2bc05633c762f59f234f37dc7b652b55 --- /dev/null +++ b/8b7178b25b/global_step84877/layer_23-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46fa41616106d8431a997f8b76bb07140de38c0a1b4ae2cb74bce96ecb7f47f0 +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_23-model_01-model_states.pt b/8b7178b25b/global_step84877/layer_23-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f27c33fbf00f89281deb5456901aad1b109f9576 --- /dev/null +++ b/8b7178b25b/global_step84877/layer_23-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8409444d93be7be55c8908e28a5057a4283d2de90c975299a096e26e116dc626 +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_24-model_00-model_states.pt b/8b7178b25b/global_step84877/layer_24-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5166c731aa0c8ca5018a91344e8ba438213e3312 --- /dev/null +++ b/8b7178b25b/global_step84877/layer_24-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dda5275a8a844590af904cc45421eb2778ef3ee93cd4bb97e8cfd9707db40d5d +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_24-model_01-model_states.pt b/8b7178b25b/global_step84877/layer_24-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dfcb8f90144cc2d250ae0c1a1c1fb46c274cf3c2 --- /dev/null +++ b/8b7178b25b/global_step84877/layer_24-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ddfaeafa57f19d09e7f1b60a9b0a786c7ec6172e9e25a054d0bea5bc7f287b6 +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_25-model_00-model_states.pt b/8b7178b25b/global_step84877/layer_25-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3a76779c87bac57d86225ec8f2008fc3d548f2c --- /dev/null +++ b/8b7178b25b/global_step84877/layer_25-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9dfedd2a08e743766b2899c8b79065ec0c88653dfb451f775a921392b3f175e2 +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_25-model_01-model_states.pt b/8b7178b25b/global_step84877/layer_25-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec6e6fc253d3bd87f528b9307f7916ec83fc1aae --- /dev/null +++ b/8b7178b25b/global_step84877/layer_25-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73c1429fa6b277037bdc54299e6e5573fe1ce77065890f602336846108111607 +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_26-model_00-model_states.pt b/8b7178b25b/global_step84877/layer_26-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3acef167a99e2e6d5b9fe13c88dde32b564452c2 --- /dev/null +++ b/8b7178b25b/global_step84877/layer_26-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36f030ac6a12180cbcd592568229b5d60a2d990f7d0c9893a26524ede04e44c9 +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_26-model_01-model_states.pt b/8b7178b25b/global_step84877/layer_26-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d456fe1f57729fb7e79243bf0f0c16f145ad92e2 --- /dev/null +++ b/8b7178b25b/global_step84877/layer_26-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9ecfad8eafbc252f9af958b1250d4320cdbddb459b295477409788aac8044d5 +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_27-model_00-model_states.pt b/8b7178b25b/global_step84877/layer_27-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d655ceab8995ecd510e884ff2317764f7216a2b --- /dev/null +++ b/8b7178b25b/global_step84877/layer_27-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:356d4faa6a2899f74c077365f1e2a43a76b112d70995c6307f176645879923ea +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_27-model_01-model_states.pt b/8b7178b25b/global_step84877/layer_27-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1253cbbfa2f73a9061d845039ca92178f547f166 --- /dev/null +++ b/8b7178b25b/global_step84877/layer_27-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1139237730946c6283d7cbf172d71f449d984db58c3421b6d94fbc689b1660cb +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_28-model_00-model_states.pt b/8b7178b25b/global_step84877/layer_28-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..40fd8d6100faa0228112c0ff87aee4d24cf41ba6 --- /dev/null +++ b/8b7178b25b/global_step84877/layer_28-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2064e61a1555d35508a14c60c0248d8c3bb4e798af668b4f2beb4a6884f7e16b +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_28-model_01-model_states.pt b/8b7178b25b/global_step84877/layer_28-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d7f35604a99f42d3bc9bea146831428bb960e16a --- /dev/null +++ b/8b7178b25b/global_step84877/layer_28-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8727ba21b1decc49cb8a096ebf4b4bf4d03509bb41ce866ef60c6d5b18cf9c9d +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_29-model_00-model_states.pt b/8b7178b25b/global_step84877/layer_29-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..62c3cc6e6ea1350da6f1ad5fbe58c8b7a17c1a3d --- /dev/null +++ b/8b7178b25b/global_step84877/layer_29-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2214d1d9dcd68fde56f36b25175a4566b3b514db659b5cbb00710c09929f4ea +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_29-model_01-model_states.pt b/8b7178b25b/global_step84877/layer_29-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..db61415b4bee532244aa1a7f321effa81facff7c --- /dev/null +++ b/8b7178b25b/global_step84877/layer_29-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35e4ab69a2e8b28b0574bf609b3e05a88ca5c206b3181aecc1b2feaed09b4c65 +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_30-model_00-model_states.pt b/8b7178b25b/global_step84877/layer_30-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e6f5bbcf1279234aa0243c6798ad70d315f0395 --- /dev/null +++ b/8b7178b25b/global_step84877/layer_30-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4719873709280127a5a5ce85362e965dd12d6670bbcb554ef09c57f7ead60c4c +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_30-model_01-model_states.pt b/8b7178b25b/global_step84877/layer_30-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..49c8e153813ab9463eb7853259687cb936943d85 --- /dev/null +++ b/8b7178b25b/global_step84877/layer_30-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a0d0ef0870eb0bb7682a0da0c6b4f6ff1cf64bb41ede0a199dcca28c986f821 +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_31-model_00-model_states.pt b/8b7178b25b/global_step84877/layer_31-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..39e12c0190f7bf03fa4491fc5aa9e464ab85e512 --- /dev/null +++ b/8b7178b25b/global_step84877/layer_31-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9eda0776d127c353e162c9ddbfce88dbdf7cee7567eb94596068b31cbe2257d8 +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_31-model_01-model_states.pt b/8b7178b25b/global_step84877/layer_31-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..631d6dfe7fc0731e8a1d620a254465532902d3dc --- /dev/null +++ b/8b7178b25b/global_step84877/layer_31-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:771f31d9a06081c5148647ea91c2cd8a5f960090cbae8b2360c994b1488327d0 +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_32-model_00-model_states.pt b/8b7178b25b/global_step84877/layer_32-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5aed40b88998262cdf2d86c7b538b1c6faac0aca --- /dev/null +++ b/8b7178b25b/global_step84877/layer_32-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c281c8fdc798122d4d6923a0bce7636634ee3ae0d80235f96dd65c7effbd4fc2 +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_32-model_01-model_states.pt b/8b7178b25b/global_step84877/layer_32-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..45135cf0e0b962455b7a6bd1417486d9f9279a2f --- /dev/null +++ b/8b7178b25b/global_step84877/layer_32-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c903f5b0757a5a30e2dfeee05ffa3162cf149def2a910ed419d89265d8bcfd2 +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_33-model_00-model_states.pt b/8b7178b25b/global_step84877/layer_33-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9ea348a4242f26d5256ef449279266cf319cc116 --- /dev/null +++ b/8b7178b25b/global_step84877/layer_33-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5202f28c4fdad42c1a3d0b44e95b89530a64b48299109fb6293b3f10b33421df +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_33-model_01-model_states.pt b/8b7178b25b/global_step84877/layer_33-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e358cc0a931634cdf3cdff4e9d31f16e8abccd5 --- /dev/null +++ b/8b7178b25b/global_step84877/layer_33-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f9c76b0335d5b7443068a0f357268c786ec6babd899883938bcb605ebeaa57c +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_34-model_00-model_states.pt b/8b7178b25b/global_step84877/layer_34-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d4d7d9f2a6e196832a26381441b347528b2bc59b --- /dev/null +++ b/8b7178b25b/global_step84877/layer_34-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4dd3bb5c0e9965de65bd20a330cc1522c5ef8432e41b02d1d0851cea196f0c6f +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_34-model_01-model_states.pt b/8b7178b25b/global_step84877/layer_34-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f315a1e313cf4c9f9d758ca91292ac5634ab0785 --- /dev/null +++ b/8b7178b25b/global_step84877/layer_34-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a54ba8e48e23afe0da2037d97f4f70c1ac1e9b88bbd534f5bc1adcba4e815c92 +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_35-model_00-model_states.pt b/8b7178b25b/global_step84877/layer_35-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0cfef9b71115439874be84e707a603db3fadd50c --- /dev/null +++ b/8b7178b25b/global_step84877/layer_35-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08ccb40e84dd8f7733ea0ad55f21fb919aab47e2a2e1a4e0d3dc69a92e8a0f5d +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_35-model_01-model_states.pt b/8b7178b25b/global_step84877/layer_35-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..878345bfa36bfb576d1c118fb03dbf04898fdba3 --- /dev/null +++ b/8b7178b25b/global_step84877/layer_35-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a23f3b2bac1971185c6c50c2b7ca5d2622dde3d95e1b424fd04ed4981698392b +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_36-model_00-model_states.pt b/8b7178b25b/global_step84877/layer_36-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ea47e7d893d1bd9e642a81c0528297379394ec6 --- /dev/null +++ b/8b7178b25b/global_step84877/layer_36-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:149b8e8ba304a788c040567c74158b5feae583d02ffa1315f6da35ed34540be1 +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_36-model_01-model_states.pt b/8b7178b25b/global_step84877/layer_36-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..89cb8014c52d036f975ef9ca8a669edf85ab6b3f --- /dev/null +++ b/8b7178b25b/global_step84877/layer_36-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6fade2902be655a3778b53e3993bafa8ae0a874be460d24737b208190b86bbaa +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_37-model_00-model_states.pt b/8b7178b25b/global_step84877/layer_37-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..594bb0786f079830b84756e47477526a2e5930b4 --- /dev/null +++ b/8b7178b25b/global_step84877/layer_37-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:578bcb4a6d35ab9eec6d62386b139361f26f1421df5b11c43baea9c4edb3baee +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_37-model_01-model_states.pt b/8b7178b25b/global_step84877/layer_37-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..675571106b6ad9a5556fef613749e21e88bc71dd --- /dev/null +++ b/8b7178b25b/global_step84877/layer_37-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4af0fa408322e249387a416aa1e86f427b0d5cc39b1289fc3cdeb4b35d7faccc +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_38-model_00-model_states.pt b/8b7178b25b/global_step84877/layer_38-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ff4237f987445a8d175b620ce5c0a2f3a94a4f1 --- /dev/null +++ b/8b7178b25b/global_step84877/layer_38-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8fdc50d7b768c22800ec019745dddab17baad375868e9e4dd46aa73045ab2df5 +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_38-model_01-model_states.pt b/8b7178b25b/global_step84877/layer_38-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c9875949f8f0b261f94cc3a1305700c3c58d98ef --- /dev/null +++ b/8b7178b25b/global_step84877/layer_38-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab1759b583b33e6d235a0f7b98e35e783248c07f767e71f451f31d39c7454855 +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_39-model_00-model_states.pt b/8b7178b25b/global_step84877/layer_39-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7417211f7414afd252475af3719a99d569975d3d --- /dev/null +++ b/8b7178b25b/global_step84877/layer_39-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7ad7a3aa08388ee7b6460f7a0444ff30cfc22ab92d9038f2820857b4a8d59b7 +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_39-model_01-model_states.pt b/8b7178b25b/global_step84877/layer_39-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b7f9562ca43a2a65c61ddd688682eb15123a2b0c --- /dev/null +++ b/8b7178b25b/global_step84877/layer_39-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1495dddf7b3e03188b307bcb8ad556fc99ebb7135ca7d2e4144b9fbca43440b +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_40-model_00-model_states.pt b/8b7178b25b/global_step84877/layer_40-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..374d8cfbe8d13b83e7d7517a0e82c103e8ff61d1 --- /dev/null +++ b/8b7178b25b/global_step84877/layer_40-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28510cc62a1d09779d5db16f32c3024ec676a3f36f878249c96b1c0956ed14ef +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_40-model_01-model_states.pt b/8b7178b25b/global_step84877/layer_40-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f2468af7e915a329e686d140e3885264bbb30d05 --- /dev/null +++ b/8b7178b25b/global_step84877/layer_40-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b372f4f039ae59fddb55b01e99be4172505c2281bdbe47b6e0bf2e5d25385b4c +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_41-model_00-model_states.pt b/8b7178b25b/global_step84877/layer_41-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..00805a80466631c902921818d7621f2f70d56d0e --- /dev/null +++ b/8b7178b25b/global_step84877/layer_41-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03f30da1672478d805c6248db9ad132ae67fcbcfc863ac5989bf41bc9097f9ac +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_41-model_01-model_states.pt b/8b7178b25b/global_step84877/layer_41-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eac344adaf55ada622ca531f56141040bbb1885c --- /dev/null +++ b/8b7178b25b/global_step84877/layer_41-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a17bceea640cb0ec8982b172b2eaeda2a823ca5e046f2fe4681756d14196944d +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_42-model_00-model_states.pt b/8b7178b25b/global_step84877/layer_42-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9879255a8b0ffa02fbef58206a1c3415535bac7d --- /dev/null +++ b/8b7178b25b/global_step84877/layer_42-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2e2d9af066eba2554af3cdd0179ef5c98e629b75ef65978b8ad8026a4b2e5d3 +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_42-model_01-model_states.pt b/8b7178b25b/global_step84877/layer_42-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c932508722a4984c51966322481623f477d19291 --- /dev/null +++ b/8b7178b25b/global_step84877/layer_42-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c996e9c907dd6aa2627b75cecc127e533d421d867db3eee62390cbce2a937976 +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_43-model_00-model_states.pt b/8b7178b25b/global_step84877/layer_43-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..090dc3a68574f0d26a493b843c2f5965e922c011 --- /dev/null +++ b/8b7178b25b/global_step84877/layer_43-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:181b9b8b4eb7db1dae0629fe63d5adfc0d39d1218ae0790d65ac4de1de949c49 +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_43-model_01-model_states.pt b/8b7178b25b/global_step84877/layer_43-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bddbbee2e19edacd2157f3ff4dd390165f581c2e --- /dev/null +++ b/8b7178b25b/global_step84877/layer_43-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb74b3cae37e9640596c3d1309eb919d7e4abb0a9f67e5e9c3c28f555ad2cdf5 +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_44-model_00-model_states.pt b/8b7178b25b/global_step84877/layer_44-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a5ab328b3b8579646db473d9bdadb16378547442 --- /dev/null +++ b/8b7178b25b/global_step84877/layer_44-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c20a31ea7638b5ce98b7af599379b3e6935ae0e7d794abc783467b67ee793e2f +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_44-model_01-model_states.pt b/8b7178b25b/global_step84877/layer_44-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5df1af8923ee564983e60728e7d218ac101a9340 --- /dev/null +++ b/8b7178b25b/global_step84877/layer_44-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7cb2ec7548670ac8fbbdc41a11fccbbe65b51ee1f7fdb57c3a4e773ce9c1236d +size 201408771 diff --git a/8b7178b25b/global_step84877/layer_46-model_00-model_states.pt b/8b7178b25b/global_step84877/layer_46-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..520ed601f99e44064771e34d73e04a87a5ab0f0f --- /dev/null +++ b/8b7178b25b/global_step84877/layer_46-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:551907871c62ff61bc58ecc22c8dbced9147dd8de18427ad98ca3b648031bd89 +size 17603 diff --git a/8b7178b25b/global_step84877/layer_46-model_01-model_states.pt b/8b7178b25b/global_step84877/layer_46-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..df8f868c33f2b424989122d2a45794a4ffbf03d6 --- /dev/null +++ b/8b7178b25b/global_step84877/layer_46-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00fe7c8ed5f5d62baf17e04db50e3d8315202d6a5e64901b97df19638dbe9ce7 +size 17603 diff --git a/8b7178b25b/global_step84877/mp_rank_00_model_states.pt b/8b7178b25b/global_step84877/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..748e7501ee4c282dc15e95423c6775b9a32e2b12 --- /dev/null +++ b/8b7178b25b/global_step84877/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60b73d9c333ef08791da4eb7b38da77f664ae1a536b73cef5774a9b97ecb80e5 +size 40115 diff --git a/8b7178b25b/global_step84877/mp_rank_01_model_states.pt b/8b7178b25b/global_step84877/mp_rank_01_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f675b52f4c17c0b2ced1762019e66c96376a236 --- /dev/null +++ b/8b7178b25b/global_step84877/mp_rank_01_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c00606e92878aad8b7779a79a6b4cac86da7bbde1ef98a28d157e5afbae1243 +size 40115 diff --git a/8b7178b25b/global_step84877/mp_rank_02_model_states.pt b/8b7178b25b/global_step84877/mp_rank_02_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b3f5ae98b03d90439a62cf584852c476c8a7ea1a --- /dev/null +++ b/8b7178b25b/global_step84877/mp_rank_02_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66e4f63cb47ecb67e642d5458118de61e65c93a223ae57cbd3d0d1a2399eff40 +size 40243 diff --git a/8b7178b25b/global_step84877/mp_rank_03_model_states.pt b/8b7178b25b/global_step84877/mp_rank_03_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ab3558c44c5c48de99c3ff0fc6fef22674a927f --- /dev/null +++ b/8b7178b25b/global_step84877/mp_rank_03_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3389a2ecff505a878426fad96c5ce69c68fb2d14f4e00a713548a9da37f77b9b +size 40243 diff --git a/8b7178b25b/transformers/config.json b/8b7178b25b/transformers/config.json new file mode 100644 index 0000000000000000000000000000000000000000..eadf3eb13cecae9db1c34cde4f4d373a9d0fe00f --- /dev/null +++ b/8b7178b25b/transformers/config.json @@ -0,0 +1 @@ +{"vocab_size": 50432, "n_positions": 2048, "n_embd": 4096, "n_layer": 42, "n_head": 32, "n_inner": 16384, "activation_function": "gelu", "resid_pdrop": 0.1, "embd_pdrop": 0.1, "attn_pdrop": 0.1, "layer_norm_epsilon": 1e-05, "initializer_range": 0.02, "summary_type": "cls_index", "summary_use_proj": true, "summary_activation": null, "summary_first_dropout": 0.1, "summary_proj_to_labels": true, "scale_attn_weights": true, "use_cache": true, "scale_attn_by_inverse_layer_idx": false, "reorder_and_upcast_attn": false, "bos_token_id": 50256, "eos_token_id": 50256, "return_dict": true, "output_hidden_states": false, "output_attentions": false, "torchscript": false, "torch_dtype": null, "use_bfloat16": false, "tf_legacy_loss": false, "pruned_heads": {}, "tie_word_embeddings": true, "is_encoder_decoder": false, "is_decoder": false, "cross_attention_hidden_size": null, "add_cross_attention": false, "tie_encoder_decoder": false, "max_length": 20, "min_length": 0, "do_sample": false, "early_stopping": false, "num_beams": 1, "num_beam_groups": 1, "diversity_penalty": 0.0, "temperature": 1.0, "top_k": 50, "top_p": 1.0, "typical_p": 1.0, "repetition_penalty": 1.0, "length_penalty": 1.0, "no_repeat_ngram_size": 0, "encoder_no_repeat_ngram_size": 0, "bad_words_ids": null, "num_return_sequences": 1, "chunk_size_feed_forward": 0, "output_scores": false, "return_dict_in_generate": false, "forced_bos_token_id": null, "forced_eos_token_id": null, "remove_invalid_values": false, "exponential_decay_length_penalty": null, "suppress_tokens": null, "begin_suppress_tokens": null, "architectures": ["GPT2LMHeadModel"], "finetuning_task": null, "id2label": {"0": "LABEL_0", "1": "LABEL_1"}, "label2id": {"LABEL_0": 0, "LABEL_1": 1}, "tokenizer_class": null, "prefix": null, "pad_token_id": null, "sep_token_id": null, "decoder_start_token_id": null, "task_specific_params": null, "problem_type": null, "_name_or_path": "", "transformers_version": "4.25.0.dev0", "n_ctx": 1024, "gradient_checkpointing": false, "model_type": "gpt2"} \ No newline at end of file diff --git a/8b7178b25b/transformers/pytorch_model.bin b/8b7178b25b/transformers/pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..0f98b2f6fdc4cca36dd8e74b92e6a44e4df7d212 --- /dev/null +++ b/8b7178b25b/transformers/pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:103da80b4f44d89e90566b3754656319a1f0b261b5ced3ee82168bc739aeea02 +size 17698351197 diff --git a/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1674481125.nid007138.60152.0 b/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1674481125.nid007138.60152.0 new file mode 100644 index 0000000000000000000000000000000000000000..741c0387d5dda99463f690ba899d7e0277bd0324 --- /dev/null +++ b/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1674481125.nid007138.60152.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e39184d4efd5a528fe05dbcf49602e7e1d2aa6b9968c32a9f6c38f468c9a0efb +size 19657 diff --git a/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1674482012.nid005934.127470.0 b/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1674482012.nid005934.127470.0 new file mode 100644 index 0000000000000000000000000000000000000000..d9d1e2ad184526775975314d5989b185ddbd3bdf --- /dev/null +++ b/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1674482012.nid005934.127470.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa412ea05b676c4a43a96f0ed29f699b522594d436a54bf7ea1957c67671ddfb +size 19657 diff --git a/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1674482459.nid007138.74648.0 b/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1674482459.nid007138.74648.0 new file mode 100644 index 0000000000000000000000000000000000000000..b92cf296931c5314bcd85959fe7a0ffbc7fc4d68 --- /dev/null +++ b/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1674482459.nid007138.74648.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:afe6c1bc332070df44c27f98ac2e7dea3025191fc6771f6178629d2a5eba314c +size 19657 diff --git a/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1674483404.nid007138.86386.0 b/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1674483404.nid007138.86386.0 new file mode 100644 index 0000000000000000000000000000000000000000..a28be2c950142b4147678da930def08645d99858 --- /dev/null +++ b/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1674483404.nid007138.86386.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31b6ae2046b3bbba73c4120e44dfb1901457c297f9a65b92c3693195982ccc8d +size 19657 diff --git a/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1674483837.nid007138.95299.0 b/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1674483837.nid007138.95299.0 new file mode 100644 index 0000000000000000000000000000000000000000..b4161db3c6cbffdd22e7a9fa3e46b1551813c7d9 --- /dev/null +++ b/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1674483837.nid007138.95299.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b76f3f5e6421c993cff1f9511299aaaf55c550e85315e72ff9ea2f2def5a56a +size 19657 diff --git a/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1674484342.nid007138.102785.0 b/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1674484342.nid007138.102785.0 new file mode 100644 index 0000000000000000000000000000000000000000..9ee45d428a58061a790854f86b828091c287e237 --- /dev/null +++ b/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1674484342.nid007138.102785.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a7af8ddb752192e14135595bfc38a2256d562ad4d21bfdaa9685b61bf50d561 +size 40 diff --git a/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1674484803.nid007138.111853.0 b/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1674484803.nid007138.111853.0 new file mode 100644 index 0000000000000000000000000000000000000000..bc887fa3d70c5dbb35f664ed303304d7f0cdbc00 --- /dev/null +++ b/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1674484803.nid007138.111853.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62a0caae97cbdd2b87a5991f729c7e6cd7c135fa7285bf2af6fae7e7a7908882 +size 19657 diff --git a/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1674485222.nid007138.118724.0 b/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1674485222.nid007138.118724.0 new file mode 100644 index 0000000000000000000000000000000000000000..0953e92f2931c98de88124fee02e8523887a4071 --- /dev/null +++ b/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1674485222.nid007138.118724.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee68ab53fd381f8c57aa01abc24a3130f9be4ff25f323624bd0d80897a22452b +size 19657 diff --git a/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1674485685.nid007138.127860.0 b/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1674485685.nid007138.127860.0 new file mode 100644 index 0000000000000000000000000000000000000000..abd4aaab721dc6acc40049cfa187e8fd6453c892 --- /dev/null +++ b/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1674485685.nid007138.127860.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d24bd953a12053345328f85b74b4233f9df2f96c792134db2901a5bbad9d1660 +size 40 diff --git a/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1674486126.nid007138.4834.0 b/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1674486126.nid007138.4834.0 new file mode 100644 index 0000000000000000000000000000000000000000..1a08690a77811d670008884e3ad14c81b9c60b28 --- /dev/null +++ b/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1674486126.nid007138.4834.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a69d9f0a3f0b0babd00a1b3e3c600f63e5de7dc29c4270d7fd45b44fb2eb021d +size 40 diff --git a/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1674552890.nid007129.88213.0 b/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1674552890.nid007129.88213.0 new file mode 100644 index 0000000000000000000000000000000000000000..72126e84947b913984e00dfe1fbb20d7e214545b --- /dev/null +++ b/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1674552890.nid007129.88213.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5497ec74175485ea1b05cb7e6e7be47dc0a5418233c16832fd6d2ae3cd9812ca +size 40 diff --git a/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1674553452.nid006981.92902.0 b/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1674553452.nid006981.92902.0 new file mode 100644 index 0000000000000000000000000000000000000000..3a0844aa3a0bdd66ad13ed24bb0d8d40f75e145b --- /dev/null +++ b/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1674553452.nid006981.92902.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4354fd5c26c9c3b20130544340e84f514460141c235007cf94cbb55bebe1bb20 +size 28658472 diff --git a/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1674642972.nid006058.116038.0 b/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1674642972.nid006058.116038.0 new file mode 100644 index 0000000000000000000000000000000000000000..32469b2a169f2237430e56125ebd953513b6763f --- /dev/null +++ b/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1674642972.nid006058.116038.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5fa1bce5ec578266213d7f586a6786523685d921dcd26d45b04a852f70c9c9da +size 40 diff --git a/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1674643531.nid007225.126533.0 b/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1674643531.nid007225.126533.0 new file mode 100644 index 0000000000000000000000000000000000000000..90319c89fc9a8813082fe71670133f825485394d --- /dev/null +++ b/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1674643531.nid007225.126533.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56c81fdb6540eef02f9bc233223d85689f3ad0847a3fd738745a572f8dcb0595 +size 11977065 diff --git a/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1674759529.nid007191.89290.0 b/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1674759529.nid007191.89290.0 new file mode 100644 index 0000000000000000000000000000000000000000..58ac3c0fd5f60c6002f6c6b7344ee83ffac15458 --- /dev/null +++ b/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1674759529.nid007191.89290.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f5e8bc21519d700090b8083d74eeb6c21fa6e8312847e6c632bc2d8c51d2f46 +size 40 diff --git a/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1674762344.nid006210.96546.0 b/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1674762344.nid006210.96546.0 new file mode 100644 index 0000000000000000000000000000000000000000..79dd17840af383cc9209f523b6f8681bd292bd51 --- /dev/null +++ b/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1674762344.nid006210.96546.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f27e2812f2f4c6404b123c26d89308ccb5a332a7bf0cfcc38247f47f68c2caa8 +size 63358 diff --git a/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1674762802.nid006210.105987.0 b/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1674762802.nid006210.105987.0 new file mode 100644 index 0000000000000000000000000000000000000000..5ae7fa91b296a0bde0a3e8cb5bc458533e2ee2e7 --- /dev/null +++ b/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1674762802.nid006210.105987.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f925e3ace78b86215b098dbe0f8d439d835a91df855788099ecb763f5fe310b +size 71953 diff --git a/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1674763290.nid006210.112440.0 b/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1674763290.nid006210.112440.0 new file mode 100644 index 0000000000000000000000000000000000000000..0d7957f55766cd80fdd89f65a9a37b269ad2b28e --- /dev/null +++ b/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1674763290.nid006210.112440.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39e1925f795be604fcc9628a767ffd018683e893501b6957e62893a28f559585 +size 40 diff --git a/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1674763853.nid006210.121919.0 b/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1674763853.nid006210.121919.0 new file mode 100644 index 0000000000000000000000000000000000000000..ce484f9e32c19030b779c9d5de25ab6f6776d210 --- /dev/null +++ b/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1674763853.nid006210.121919.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e65e94c0e15715d71cf32e53d8492b642082b07c14d35c937889f7da8998f79 +size 40 diff --git a/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1674910928.nid007049.6996.0 b/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1674910928.nid007049.6996.0 new file mode 100644 index 0000000000000000000000000000000000000000..064793c33ee1eabe816fedb9f36ea94ae8b9c443 --- /dev/null +++ b/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1674910928.nid007049.6996.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3933d64216a2023db9c1cce04fdabaeaa5a30144bbfbbedbf5eb5d7fa8a59981 +size 5459509 diff --git a/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1674948891.nid007035.116321.0 b/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1674948891.nid007035.116321.0 new file mode 100644 index 0000000000000000000000000000000000000000..fc21d4d3a397f18f628a952c0970cb8ee3ba76ad --- /dev/null +++ b/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1674948891.nid007035.116321.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c85f3cf166886f1a178fa7c8a142856d324f3a8349fdbb899555e8d914e53f4 +size 40 diff --git a/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1674949340.nid007035.123028.0 b/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1674949340.nid007035.123028.0 new file mode 100644 index 0000000000000000000000000000000000000000..77762bf541fd2cb597598bb3f52635670c3aa0ea --- /dev/null +++ b/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1674949340.nid007035.123028.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d4ee7200d397fa2c4fcb77ab3f5b868f95131123202ed0ca48226eb27d05417 +size 55702927 diff --git a/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1675122395.nid006789.62590.0 b/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1675122395.nid006789.62590.0 new file mode 100644 index 0000000000000000000000000000000000000000..2fcd2a1b29321e29c0397e4f78705179fa132425 --- /dev/null +++ b/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1675122395.nid006789.62590.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06d17d8f817751a136f5fcf805dbcba694b031902adb2e05e5ee545b021aa2a3 +size 54019578 diff --git a/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1675295173.nid005100.63633.0 b/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1675295173.nid005100.63633.0 new file mode 100644 index 0000000000000000000000000000000000000000..9e5fd8a6ae5c8c9e8bf02820f95d503891750e11 --- /dev/null +++ b/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1675295173.nid005100.63633.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6dbab32fcaeb31b83c039a31bce1891e2cd92aa242c5a6573bb68d6d32ca3883 +size 40 diff --git a/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1675295804.nid005855.109023.0 b/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1675295804.nid005855.109023.0 new file mode 100644 index 0000000000000000000000000000000000000000..80c8b40e4b0f5b042fcaa75cafd89581bb89f4b7 --- /dev/null +++ b/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1675295804.nid005855.109023.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ca91c2a4fc17c7068c32e62f26dfac64f3394157564a3abee4473a4d3fd7749 +size 8794719 diff --git a/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1675324203.nid005100.52401.0 b/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1675324203.nid005100.52401.0 new file mode 100644 index 0000000000000000000000000000000000000000..bbc1a439af5d526a5cf7d98b156c83337964e3ca --- /dev/null +++ b/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1675324203.nid005100.52401.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1ef972680ec304187cebbf6176c37b8dfa858c4570b8f5c99401d40a19353c4 +size 40 diff --git a/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1675324824.nid005100.59528.0 b/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1675324824.nid005100.59528.0 new file mode 100644 index 0000000000000000000000000000000000000000..4ffe68082889db27f1b6f077fdceb014f444cbbc --- /dev/null +++ b/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1675324824.nid005100.59528.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb842ef2fc91a1dd035fd6d430f9af630c57fb9824b9462a1e19c27ebae099fa +size 40 diff --git a/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1675325429.nid005787.81891.0 b/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1675325429.nid005787.81891.0 new file mode 100644 index 0000000000000000000000000000000000000000..3843f0eb45609efbef04d9abde5d9b9370601fd2 --- /dev/null +++ b/tensorboard/tensorboard_8b7178b25boscar/events.out.tfevents.1675325429.nid005787.81891.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d2da27be94615eacad895776edeba6f2198f6dad4565a612fc604b8feb5c848 +size 40